/** * @file * @brief Source file for Object Detection effect class * @author Jonathan Thomas * * @ref License */ /* LICENSE * * Copyright (c) 2008-2019 OpenShot Studios, LLC * . This file is part of * OpenShot Library (libopenshot), an open-source project dedicated to * delivering high quality video editing and animation solutions to the * world. For more information visit . * * OpenShot Library (libopenshot) is free software: you can redistribute it * and/or modify it under the terms of the GNU Lesser General Public License * as published by the Free Software Foundation, either version 3 of the * License, or (at your option) any later version. * * OpenShot Library (libopenshot) is distributed in the hope that it will be * useful, but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public License * along with OpenShot Library. If not, see . */ #include "../../include/effects/ObjectDetection.h" #include "../../include/effects/Tracker.h" using namespace openshot; /// Blank constructor, useful when using Json to load the effect properties ObjectDetection::ObjectDetection(std::string clipObDetectDataPath) { // Init effect properties init_effect_details(); // Tries to load the tracker data from protobuf LoadObjDetectdData(clipObDetectDataPath); } // Default constructor ObjectDetection::ObjectDetection() { // Init effect properties init_effect_details(); } // Init effect settings void ObjectDetection::init_effect_details() { /// Initialize the values of the EffectInfo struct. InitEffectInfo(); /// Set the effect info info.class_name = "Object Detector"; info.name = "Object Detector"; info.description = "Detect objects through the video."; info.has_audio = false; info.has_video = true; } // This method is required for all derived classes of EffectBase, and returns a // modified openshot::Frame object std::shared_ptr ObjectDetection::GetFrame(std::shared_ptr frame, int64_t frame_number) { // Get the frame's image cv::Mat cv_image = frame->GetImageCV(); // Check if frame isn't NULL if(!cv_image.empty()){ // Check if track data exists for the requested frame if (detectionsData.find(frame_number) != detectionsData.end()) { DetectionData detections = detectionsData[frame_number]; for(int i = 0; iSetImageCV(cv_image); return frame; } void ObjectDetection::drawPred(int classId, float conf, cv::Rect2d box, cv::Mat& frame) { //Draw a rectangle displaying the bounding box cv::rectangle(frame, box, cv::Scalar(255, 178, 50), 3); //Get the label for the class name and its confidence std::string label = cv::format("%.2f", conf); if (!classNames.empty()) { CV_Assert(classId < (int)classNames.size()); label = classNames[classId] + ":" + label; } //Display the label at the box.y of the bounding box int baseLine; cv::Size labelSize = getTextSize(label, cv::FONT_HERSHEY_SIMPLEX, 0.5, 1, &baseLine); box.y = std::max((int)box.y, labelSize.height); cv::rectangle(frame, cv::Point(box.x, box.y - round(1.5*labelSize.height)), cv::Point(box.x + round(1.5*labelSize.width), box.y + baseLine), cv::Scalar(255, 255, 255), cv::FILLED); putText(frame, label, cv::Point(box.x, box.y), cv::FONT_HERSHEY_SIMPLEX, 0.75, cv::Scalar(0,0,0),1); } // Load protobuf data file bool ObjectDetection::LoadObjDetectdData(std::string inputFilePath){ // Create tracker message libopenshotobjdetect::ObjDetect objMessage; { // Read the existing tracker message. fstream input(inputFilePath, ios::in | ios::binary); if (!objMessage.ParseFromIstream(&input)) { cerr << "Failed to parse protobuf message." << endl; return false; } } // Make sure the trackedData is empty classNames.clear(); detectionsData.clear(); for(int i = 0; i < objMessage.classnames_size(); i++){ classNames.push_back(objMessage.classnames(i)); } // Iterate over all frames of the saved message for (size_t i = 0; i < objMessage.frame_size(); i++) { const libopenshotobjdetect::Frame& pbFrameData = objMessage.frame(i); // Load frame and rotation data size_t id = pbFrameData.id(); // Load bounding box data const google::protobuf::RepeatedPtrField &box = pbFrameData.bounding_box(); std::vector classIds; std::vector confidences; std::vector boxes; for(int i = 0; i < pbFrameData.bounding_box_size(); i++){ int x1 = box.at(i).x1(); int y1 = box.at(i).y1(); int x2 = box.at(i).x2(); int y2 = box.at(i).y2(); int classId = box.at(i).classid(); float confidence = box.at(i).confidence(); cv::Rect2d box(x1, y1, x2-x1, y2-y1); boxes.push_back(box); classIds.push_back(classId); confidences.push_back(confidence); } // Assign data to tracker map detectionsData[id] = DetectionData(classIds, confidences, boxes, id); } // Show the time stamp from the last update in tracker data file if (objMessage.has_last_updated()) { cout << " Loaded Data. Saved Time Stamp: " << TimeUtil::ToString(objMessage.last_updated()) << endl; } // Delete all global objects allocated by libprotobuf. google::protobuf::ShutdownProtobufLibrary(); return true; } // Get tracker info for the desired frame DetectionData ObjectDetection::GetTrackedData(size_t frameId){ // Check if the tracker info for the requested frame exists if ( detectionsData.find(frameId) == detectionsData.end() ) { return DetectionData(); } else { return detectionsData[frameId]; } } // Generate JSON string of this object std::string ObjectDetection::Json() const { // Return formatted string return JsonValue().toStyledString(); } // Generate Json::Value for this object Json::Value ObjectDetection::JsonValue() const { // Create root json object Json::Value root = EffectBase::JsonValue(); // get parent properties root["type"] = info.class_name; root["protobuf_data_path"] = protobuf_data_path; // return JsonValue return root; } // Load JSON string into this object void ObjectDetection::SetJson(const std::string value) { // Parse JSON string into JSON objects try { const Json::Value root = openshot::stringToJson(value); // Set all values that match SetJsonValue(root); } catch (const std::exception& e) { // Error parsing JSON (or missing keys) throw InvalidJSON("JSON is invalid (missing keys or invalid data types)"); } } // Load Json::Value into this object void ObjectDetection::SetJsonValue(const Json::Value root) { // Set parent data EffectBase::SetJsonValue(root); // Set data from Json (if key is found) if (!root["protobuf_data_path"].isNull()){ protobuf_data_path = (root["protobuf_data_path"].asString()); if(!LoadObjDetectdData(protobuf_data_path)){ std::cout<<"Invalid protobuf data path"; protobuf_data_path = ""; } } } // Get all properties for a specific frame std::string ObjectDetection::PropertiesJSON(int64_t requested_frame) const { // Generate JSON properties list Json::Value root; root["id"] = add_property_json("ID", 0.0, "string", Id(), NULL, -1, -1, true, requested_frame); root["position"] = add_property_json("Position", Position(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame); root["layer"] = add_property_json("Track", Layer(), "int", "", NULL, 0, 20, false, requested_frame); root["start"] = add_property_json("Start", Start(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame); root["end"] = add_property_json("End", End(), "float", "", NULL, 0, 1000 * 60 * 30, false, requested_frame); root["duration"] = add_property_json("Duration", Duration(), "float", "", NULL, 0, 1000 * 60 * 30, true, requested_frame); // Return formatted string return root.toStyledString(); }