You've already forked libopenshot
mirror of
https://github.com/OpenShot/libopenshot.git
synced 2026-03-02 08:53:52 -08:00
Added CVObjectDetection and ObjectDetection effect
Also included kalman filter functions and code for tracking the output boxes from DNN model
This commit is contained in:
261
src/effects/ObjectDetection.cpp
Normal file
261
src/effects/ObjectDetection.cpp
Normal file
@@ -0,0 +1,261 @@
|
||||
/**
|
||||
* @file
|
||||
* @brief Source file for Object Detection effect class
|
||||
* @author Jonathan Thomas <jonathan@openshot.org>
|
||||
*
|
||||
* @ref License
|
||||
*/
|
||||
|
||||
/* LICENSE
|
||||
*
|
||||
* Copyright (c) 2008-2019 OpenShot Studios, LLC
|
||||
* <http://www.openshotstudios.com/>. This file is part of
|
||||
* OpenShot Library (libopenshot), an open-source project dedicated to
|
||||
* delivering high quality video editing and animation solutions to the
|
||||
* world. For more information visit <http://www.openshot.org/>.
|
||||
*
|
||||
* OpenShot Library (libopenshot) is free software: you can redistribute it
|
||||
* and/or modify it under the terms of the GNU Lesser General Public License
|
||||
* as published by the Free Software Foundation, either version 3 of the
|
||||
* License, or (at your option) any later version.
|
||||
*
|
||||
* OpenShot Library (libopenshot) is distributed in the hope that it will be
|
||||
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* GNU Lesser General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU Lesser General Public License
|
||||
* along with OpenShot Library. If not, see <http://www.gnu.org/licenses/>.
|
||||
*/
|
||||
|
||||
#include "../../include/effects/ObjectDetection.h"
|
||||
#include "../../include/effects/Tracker.h"
|
||||
|
||||
using namespace openshot;
|
||||
|
||||
/// Blank constructor, useful when using Json to load the effect properties
|
||||
ObjectDetection::ObjectDetection(std::string clipObDetectDataPath)
|
||||
{
|
||||
// Init effect properties
|
||||
init_effect_details();
|
||||
|
||||
// Tries to load the tracker data from protobuf
|
||||
LoadObjDetectdData(clipObDetectDataPath);
|
||||
}
|
||||
|
||||
// Default constructor
|
||||
ObjectDetection::ObjectDetection()
|
||||
{
|
||||
// Init effect properties
|
||||
init_effect_details();
|
||||
|
||||
}
|
||||
|
||||
// Init effect settings
|
||||
void ObjectDetection::init_effect_details()
|
||||
{
|
||||
/// Initialize the values of the EffectInfo struct.
|
||||
InitEffectInfo();
|
||||
|
||||
/// Set the effect info
|
||||
info.class_name = "Object Detector";
|
||||
info.name = "Object Detector";
|
||||
info.description = "Detect objects through the video.";
|
||||
info.has_audio = false;
|
||||
info.has_video = true;
|
||||
}
|
||||
|
||||
// This method is required for all derived classes of EffectBase, and returns a
|
||||
// modified openshot::Frame object
|
||||
std::shared_ptr<Frame> ObjectDetection::GetFrame(std::shared_ptr<Frame> frame, int64_t frame_number)
|
||||
{
|
||||
// Get the frame's image
|
||||
cv::Mat cv_image = frame->GetImageCV();
|
||||
|
||||
// Check if frame isn't NULL
|
||||
if(!cv_image.empty()){
|
||||
|
||||
// Check if track data exists for the requested frame
|
||||
if (detectionsData.find(frame_number) != detectionsData.end()) {
|
||||
|
||||
DetectionData detections = detectionsData[frame_number];
|
||||
for(int i = 0; i<detections.boxes.size(); i++){
|
||||
drawPred(detections.classIds.at(i), detections.confidences.at(i),
|
||||
detections.boxes.at(i), cv_image);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Set image with drawn box to frame
|
||||
// If the input image is NULL or doesn't have tracking data, it's returned as it came
|
||||
frame->SetImageCV(cv_image);
|
||||
|
||||
return frame;
|
||||
}
|
||||
|
||||
void ObjectDetection::drawPred(int classId, float conf, cv::Rect2d box, cv::Mat& frame)
|
||||
{
|
||||
//Draw a rectangle displaying the bounding box
|
||||
cv::rectangle(frame, box, cv::Scalar(255, 178, 50), 3);
|
||||
|
||||
//Get the label for the class name and its confidence
|
||||
std::string label = cv::format("%.2f", conf);
|
||||
if (!classNames.empty())
|
||||
{
|
||||
CV_Assert(classId < (int)classNames.size());
|
||||
label = classNames[classId] + ":" + label;
|
||||
}
|
||||
|
||||
//Display the label at the box.y of the bounding box
|
||||
int baseLine;
|
||||
cv::Size labelSize = getTextSize(label, cv::FONT_HERSHEY_SIMPLEX, 0.5, 1, &baseLine);
|
||||
box.y = std::max((int)box.y, labelSize.height);
|
||||
cv::rectangle(frame, cv::Point(box.x, box.y - round(1.5*labelSize.height)), cv::Point(box.x + round(1.5*labelSize.width), box.y + baseLine), cv::Scalar(255, 255, 255), cv::FILLED);
|
||||
putText(frame, label, cv::Point(box.x, box.y), cv::FONT_HERSHEY_SIMPLEX, 0.75, cv::Scalar(0,0,0),1);
|
||||
}
|
||||
|
||||
// Load protobuf data file
|
||||
bool ObjectDetection::LoadObjDetectdData(std::string inputFilePath){
|
||||
// Create tracker message
|
||||
libopenshotobjdetect::ObjDetect objMessage;
|
||||
|
||||
{
|
||||
// Read the existing tracker message.
|
||||
fstream input(inputFilePath, ios::in | ios::binary);
|
||||
if (!objMessage.ParseFromIstream(&input)) {
|
||||
cerr << "Failed to parse protobuf message." << endl;
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
// Make sure the trackedData is empty
|
||||
classNames.clear();
|
||||
detectionsData.clear();
|
||||
|
||||
for(int i = 0; i < objMessage.classnames_size(); i++){
|
||||
classNames.push_back(objMessage.classnames(i));
|
||||
}
|
||||
|
||||
// Iterate over all frames of the saved message
|
||||
for (size_t i = 0; i < objMessage.frame_size(); i++) {
|
||||
const libopenshotobjdetect::Frame& pbFrameData = objMessage.frame(i);
|
||||
|
||||
// Load frame and rotation data
|
||||
size_t id = pbFrameData.id();
|
||||
|
||||
// Load bounding box data
|
||||
const google::protobuf::RepeatedPtrField<libopenshotobjdetect::Frame_Box > &box = pbFrameData.bounding_box();
|
||||
|
||||
std::vector<int> classIds;
|
||||
std::vector<float> confidences;
|
||||
std::vector<cv::Rect> boxes;
|
||||
|
||||
for(int i = 0; i < pbFrameData.bounding_box_size(); i++){
|
||||
int x1 = box.at(i).x1();
|
||||
int y1 = box.at(i).y1();
|
||||
int x2 = box.at(i).x2();
|
||||
int y2 = box.at(i).y2();
|
||||
int classId = box.at(i).classid();
|
||||
float confidence = box.at(i).confidence();
|
||||
|
||||
cv::Rect2d box(x1, y1, x2-x1, y2-y1);
|
||||
|
||||
boxes.push_back(box);
|
||||
classIds.push_back(classId);
|
||||
confidences.push_back(confidence);
|
||||
}
|
||||
|
||||
// Assign data to tracker map
|
||||
detectionsData[id] = DetectionData(classIds, confidences, boxes, id);
|
||||
}
|
||||
|
||||
// Show the time stamp from the last update in tracker data file
|
||||
if (objMessage.has_last_updated()) {
|
||||
cout << " Loaded Data. Saved Time Stamp: " << TimeUtil::ToString(objMessage.last_updated()) << endl;
|
||||
}
|
||||
|
||||
// Delete all global objects allocated by libprotobuf.
|
||||
google::protobuf::ShutdownProtobufLibrary();
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
// Get tracker info for the desired frame
|
||||
DetectionData ObjectDetection::GetTrackedData(size_t frameId){
|
||||
|
||||
// Check if the tracker info for the requested frame exists
|
||||
if ( detectionsData.find(frameId) == detectionsData.end() ) {
|
||||
return DetectionData();
|
||||
} else {
|
||||
return detectionsData[frameId];
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
// Generate JSON string of this object
|
||||
std::string ObjectDetection::Json() const {
|
||||
|
||||
// Return formatted string
|
||||
return JsonValue().toStyledString();
|
||||
}
|
||||
|
||||
// Generate Json::Value for this object
|
||||
Json::Value ObjectDetection::JsonValue() const {
|
||||
|
||||
// Create root json object
|
||||
Json::Value root = EffectBase::JsonValue(); // get parent properties
|
||||
root["type"] = info.class_name;
|
||||
root["protobuf_data_path"] = protobuf_data_path;
|
||||
|
||||
// return JsonValue
|
||||
return root;
|
||||
}
|
||||
|
||||
// Load JSON string into this object
|
||||
void ObjectDetection::SetJson(const std::string value) {
|
||||
|
||||
// Parse JSON string into JSON objects
|
||||
try
|
||||
{
|
||||
const Json::Value root = openshot::stringToJson(value);
|
||||
// Set all values that match
|
||||
SetJsonValue(root);
|
||||
}
|
||||
catch (const std::exception& e)
|
||||
{
|
||||
// Error parsing JSON (or missing keys)
|
||||
throw InvalidJSON("JSON is invalid (missing keys or invalid data types)");
|
||||
}
|
||||
}
|
||||
|
||||
// Load Json::Value into this object
|
||||
void ObjectDetection::SetJsonValue(const Json::Value root) {
|
||||
|
||||
// Set parent data
|
||||
EffectBase::SetJsonValue(root);
|
||||
// Set data from Json (if key is found)
|
||||
if (!root["protobuf_data_path"].isNull()){
|
||||
protobuf_data_path = (root["protobuf_data_path"].asString());
|
||||
|
||||
if(!LoadObjDetectdData(protobuf_data_path)){
|
||||
std::cout<<"Invalid protobuf data path";
|
||||
protobuf_data_path = "";
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Get all properties for a specific frame
|
||||
std::string ObjectDetection::PropertiesJSON(int64_t requested_frame) const {
|
||||
|
||||
// Generate JSON properties list
|
||||
Json::Value root;
|
||||
root["id"] = add_property_json("ID", 0.0, "string", Id(), NULL, -1, -1, true, requested_frame);
|
||||
root["position"] = add_property_json("Position", Position(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame);
|
||||
root["layer"] = add_property_json("Track", Layer(), "int", "", NULL, 0, 20, false, requested_frame);
|
||||
root["start"] = add_property_json("Start", Start(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame);
|
||||
root["end"] = add_property_json("End", End(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame);
|
||||
root["duration"] = add_property_json("Duration", Duration(), "float", "", NULL, 0, 1000 * 60 * 30, true, requested_frame);
|
||||
|
||||
// Return formatted string
|
||||
return root.toStyledString();
|
||||
}
|
||||
Reference in New Issue
Block a user