1 год назад · 3fe67633cf
--- a/ReadMe.txt
+++ b/ReadMe.txt
@@ -23,4 +23,5 @@ v0.1.21
 
				 v0.1.22 切割模型标注关键点更改，2、3点分别是第一、二叶子分叉点
			
 
				 v0.1.23 抓取点以关键点4为基础偏移
			
 
				 v0.1.24 切割位置识别,增加kp3_weight_cut参数，控制抓取点在点3和点2间的位置，在[0,1.0]间，越大越靠近点3
			
 
				-v0.1.25 抓取功能扩展：增加是否空盘识别；增加叶尖朝向优先功能；增加单株优先功能；完善抓取接口返回数值定义
			
 
				+v0.1.25 抓取功能扩展：增加是否空盘识别；增加叶尖朝向优先功能；增加单株优先功能；完善抓取接口返回数值定义
			
 
				+v0.2.0 抓取优化，采用YOLOv8模型，OpenCV 4.9.0
			
--- a/inference.cpp
+++ b/inference.cpp
@@ -47,6 +47,7 @@ std::vector<Detection> Inference::runInference(const cv::Mat &input)
 
				     std::vector<int> class_ids;
			
 
				     std::vector<float> confidences;
			
 
				     std::vector<cv::Rect> boxes;
			
 
				+	std::vector<std::vector<cv::Point>> kpts;
			
 
				 
			
 
				     for (int i = 0; i < rows; ++i)
			
 
				     {
			
@@ -76,6 +77,16 @@ std::vector<Detection> Inference::runInference(const cv::Mat &input)
 
				                 int width = int(w * x_factor);
			
 
				                 int height = int(h * y_factor);
			
 
				 
			
 
				+				int step = 3;
			
 
				+				std::vector<cv::Point> kps;
			
 
				+				for (int kpi = 0; kpi < 5; ++kpi) {
			
 
				+					float kp_x = data[5 + kpi * step];
			
 
				+					float kp_y = data[5 + kpi * step + 1];
			
 
				+					cv::Point kp(int(kp_x * x_factor), int(kp_y * y_factor));
			
 
				+					kps.push_back(kp);
			
 
				+				}
			
 
				+				kpts.push_back(kps);
			
 
				+
			
 
				                 boxes.push_back(cv::Rect(left, top, width, height));
			
 
				             }
			
 
				         }
			
@@ -138,6 +149,7 @@ std::vector<Detection> Inference::runInference(const cv::Mat &input)
 
				 
			
 
				         result.className = classes[result.class_id];
			
 
				         result.box = boxes[idx];
			
 
				+		result.kpts = kpts[idx];
			
 
				 
			
 
				         detections.push_back(result);
			
 
				     }
			
@@ -155,6 +167,7 @@ void Inference::loadClassesFromFile()
 
				             classes.push_back(classLine);
			
 
				         inputFile.close();
			
 
				     }
			
 
				+	classes.push_back(std::string("tea"));
			
 
				 }
			
 
				 
			
 
				 void Inference::loadOnnxNetwork()
			
--- a/inference.h
+++ b/inference.h
@@ -19,6 +19,7 @@ struct Detection
 
				     float confidence{0.0};
			
 
				     cv::Scalar color{};
			
 
				     cv::Rect box{};
			
 
				+	std::vector<cv::Point> kpts{};
			
 
				 };
			
 
				 
			
 
				 class Inference
			
@@ -26,7 +27,10 @@ class Inference
 
				 public:
			
 
				     Inference(const std::string &onnxModelPath, const cv::Size2f &modelInputShape, const std::string &classesTxtFile, const bool &runWithCuda = true);
			
 
				     std::vector<Detection> runInference(const cv::Mat &input);
			
 
				-
			
 
				+	
			
 
				+	void setModelConfidenseThreshold(float t) { modelConfidenseThreshold = t; };
			
 
				+	void setModelScoreThreshold(float t) { modelScoreThreshold = t; };
			
 
				+	void setModelNMSThreshold(float t) { modelNMSThreshold = t; }
			
 
				 private:
			
 
				     void loadClassesFromFile();
			
 
				     void loadOnnxNetwork();
			
--- a/tcv_conf.yml
+++ b/tcv_conf.yml
@@ -6,8 +6,8 @@ conf_parameters:
 
				    image_save: 1
			
 
				    image_depository: "D:\\logs\\algo_img"
			
 
				    image_backup_days: 7
			
 
				-   model_path_grab: "D:/projects/graft/py_code/retina_tea5/TeaDetector_grab_20231223061511.onnx"
			
 
				-   object_threshold_grab: 0.85
			
 
				+   model_path_grab: "D:/projects/graft/py_code/yolo8_tea/tea_grab/teagrab_20240108_2002/weights/best.onnx"
			
 
				+   object_threshold_grab: 0.65
			
 
				    nms_threshold_grab: 1.0000000149011612e-01
			
 
				    grid_row_grab: 2
			
 
				    grid_col_grab: 3
			
@@ -17,7 +17,8 @@ conf_parameters:
 
				    min_area_ratio_grab: 0.0
			
 
				    max_area_ratio_grab: 0.12
			
 
				    rot_degree_grab: 0
			
 
				-   model_path_cut: "D:/projects/graft/py_code/retina_tea5/TeaDetector_cut_20231219003541.onnx"
			
 
				+   # model_path_cut: "D:/projects/graft/py_code/retina_tea5/TeaDetector_cut_20231219003541.onnx"
			
 
				+   model_path_cut: "D:/projects/graft/py_code/yolo8_tea/tea_cut/teacut_20240106_200/weights/best.onnx"
			
 
				    object_threshold_cut: 0.8
			
 
				    nms_threshold_cut: 0.1
			
 
				    grid_row_cut: 1
			
--- a/tea_cv_api.cpp
+++ b/tea_cv_api.cpp
@@ -18,7 +18,7 @@ extern CRITICAL_SECTION g_cs;
 
				 namespace graft_cv
			
 
				 {
			
 
				 
			
 
				-	char *g_version_str = "0.1.25";
			
 
				+	char *g_version_str = "0.2.0";
			
 
				 
			
 
				 	//configure
			
 
				 	string g_conf_file = "./tcv_conf.yml";	
			
--- a/tea_detect.cpp
+++ b/tea_detect.cpp
@@ -281,9 +281,10 @@ namespace graft_cv {
 
				 	//////////////////////////////////////////////////////////////////////////////////
			
 
				 	//////////////////////////////////////////////////////////////////////////////////
			
 
				 	YoloDrop::YoloDrop(CGcvLogger* pLogger, float obj_th, float nms_th)
			
 
				-		:m_model_loaded(false)
			
 
				+		:m_model_loaded(false),
			
 
				+		m_pInfer(0),
			
 
				+		m_runWithCuda(false)
			
 
				 	{
			
 
				-		m_infer = Inference(const std::string &onnxModelPath, const cv::Size2f &modelInputShape, const std::string &classesTxtFile, const bool &runWithCuda = true);
			
 
				 		BATCH_SIZE = 1;
			
 
				 		INPUT_CHANNEL = 3;
			
 
				 		IMAGE_WIDTH = 640; // default 640
			
@@ -307,7 +308,7 @@ namespace graft_cv {
 
				 		m_feature_steps = { 8,16,32 };
			
 
				 		m_pLogger = pLogger;
			
 
				 
			
 
				-		for (const int step : m_feature_steps) {
			
 
				+		/*for (const int step : m_feature_steps) {
			
 
				 			assert(step != 0);
			
 
				 			int feature_map = IMAGE_HEIGHT / step;
			
 
				 			m_feature_maps.push_back(feature_map);
			
@@ -316,7 +317,7 @@ namespace graft_cv {
 
				 		}
			
 
				 		m_anchor_sizes = { { 16,32 } ,{ 64,128 },{ 256, 512 } };
			
 
				 		m_sum_of_feature = std::accumulate(m_feature_sizes.begin(), m_feature_sizes.end(), 0) * m_anchor_num;
			
 
				-		generate_anchors();
			
 
				+		generate_anchors();*/
			
 
				 		if (m_pLogger) {
			
 
				 			m_pLogger->INFO(string("YoloDrop object initialized"));
			
 
				 		}
			
@@ -331,15 +332,33 @@ namespace graft_cv {
 
				 	{
			
 
				 		this->m_obj_threshold = object_threshold;
			
 
				 		this->m_nms_threshold = nms_threshold;
			
 
				+		if (m_pInfer) {
			
 
				+			m_pInfer->setModelNMSThreshold(m_nms_threshold);
			
 
				+			m_pInfer->setModelScoreThreshold(m_obj_threshold);
			
 
				+		}
			
 
				 	}
			
 
				 
			
 
				 	bool YoloDrop::LoadModel(std::string onnx_path) {
			
 
				+		if (m_pInfer) {
			
 
				+			delete m_pInfer;
			
 
				+			m_pInfer = 0;
			
 
				+			m_model_loaded = false;
			
 
				+
			
 
				+		}		
			
 
				+		cv::Size2f modelInputShape((float)IMAGE_WIDTH, (float)IMAGE_HEIGHT);		
			
 
				+		
			
 
				 		if (m_pLogger) {
			
 
				 			m_pLogger->INFO(string("Loading detection model: ") + onnx_path);
			
 
				 		}
			
 
				 		else { std::cout << "Loading detection model: " << onnx_path << std::endl; }
			
 
				 		try {
			
 
				-			m_model = cv::dnn::readNetFromONNX(onnx_path);
			
 
				+			m_pInfer = new Inference(onnx_path, modelInputShape, "", m_runWithCuda);
			
 
				+			if (!m_pInfer) {
			
 
				+				throw(string("inference init error"));
			
 
				+			}
			
 
				+			m_pInfer->setModelNMSThreshold(m_nms_threshold);
			
 
				+			m_pInfer->setModelScoreThreshold(m_obj_threshold);
			
 
				+
			
 
				 			if (m_pLogger) { m_pLogger->INFO(string("Detection model loaded")); }
			
 
				 			m_model_loaded = true;
			
 
				 			return m_model_loaded;
			
@@ -351,10 +370,10 @@ namespace graft_cv {
 
				 		return false;
			
 
				 	}
			
 
				 
			
 
				-	std::vector<Bbox> YoloDrop::RunModel(cv::Mat& img, CGcvLogger* pInstanceLogger)
			
 
				+	std::vector<Bbox> YoloDrop::RunModel(cv::Mat& frame, CGcvLogger* pInstanceLogger)
			
 
				 	{
			
 
				 		std::vector<Bbox> result;
			
 
				-		if (img.empty()) {
			
 
				+		if (frame.empty()) {
			
 
				 			if (pInstanceLogger) {
			
 
				 				pInstanceLogger->ERRORINFO(string("RunModel(), input image is empty"));
			
 
				 			}
			
@@ -362,51 +381,76 @@ namespace graft_cv {
 
				 		}
			
 
				 		if (!m_model_loaded) {
			
 
				 			pInstanceLogger->ERRORINFO(string("model is NOT loaded"));
			
 
				+			throw(string("model is NOT loaded"));
			
 
				 		}
			
 
				-		cv::Mat blob = cv::dnn::blobFromImage(
			
 
				-			img,
			
 
				-			1.0,
			
 
				-			m_size_detection,
			
 
				-			m_img_mean);
			
 
				-		m_model.setInput(blob);
			
 
				 
			
 
				-		std::vector<std::string> outNames = m_model.getUnconnectedOutLayersNames();
			
 
				-		vector<Mat>outputs;// location(1x16800x4), confidence(1x16800x2), keypoint(1x16800x2)
			
 
				-		if (pInstanceLogger) {
			
 
				-			pInstanceLogger->INFO(string("RunModel(), before forward()"));
			
 
				-		}
			
 
				-		m_model.forward(outputs, outNames);
			
 
				-		std::vector<YoloDrop::DropRes> rects;
			
 
				-		int n = post_process(img, outputs, rects);
			
 
				-		for (const auto& rect : rects) {
			
 
				-			Bbox box;
			
 
				-			box.score = rect.confidence;
			
 
				-			box.x1 = (int)rect.drop_box.x1;
			
 
				-			box.y1 = (int)rect.drop_box.y1;
			
 
				-			box.x2 = (int)rect.drop_box.x2;
			
 
				-			box.y2 = (int)rect.drop_box.y2;
			
 
				-			box.ppoint[0] = rect.keypoints[0].x;
			
 
				-			box.ppoint[1] = rect.keypoints[0].y;
			
 
				-			box.ppoint[2] = rect.keypoints[1].x;
			
 
				-			box.ppoint[3] = rect.keypoints[1].y;
			
 
				-			box.ppoint[4] = rect.keypoints[2].x;
			
 
				-			box.ppoint[5] = rect.keypoints[2].y;
			
 
				-			box.ppoint[6] = rect.keypoints[3].x;
			
 
				-			box.ppoint[7] = rect.keypoints[3].y;
			
 
				-			box.ppoint[8] = rect.keypoints[4].x;
			
 
				-			box.ppoint[9] = rect.keypoints[4].y;
			
 
				+		// Inference starts here...
			
 
				+		std::vector<Detection> output = m_pInfer->runInference(frame);
			
 
				 
			
 
				-			box.operate_point[0] = 0.0;
			
 
				-			box.operate_point[1] = 0.0;
			
 
				-			box.operate_angle = 0.0;
			
 
				+		int detections = output.size();
			
 
				+		std::cout << "Number of detections:" << detections << std::endl;
			
 
				 
			
 
				-			box.area = 0.0;
			
 
				-			box.status = 0;
			
 
				-			result.push_back(box);
			
 
				+		for (int i = 0; i < detections; ++i)
			
 
				+		{
			
 
				+			Detection detection = output[i];
			
 
				+
			
 
				+			cv::Rect box = detection.box;
			
 
				+			cv::Scalar color = detection.color;
			
 
				+			std::vector<cv::Point> pts = detection.kpts;
			
 
				+
			
 
				+			Bbox box_out;
			
 
				+			box_out.score = detection.confidence;
			
 
				+			box_out.x1 = box.x;
			
 
				+			box_out.y1 = box.y;
			
 
				+			box_out.x2 = box.x + box.width;
			
 
				+			box_out.y2 = box.y + box.height;
			
 
				+			box_out.ppoint[0] = pts[0].x;
			
 
				+			box_out.ppoint[1] = pts[0].y;
			
 
				+			box_out.ppoint[2] = pts[1].x;
			
 
				+			box_out.ppoint[3] = pts[1].y;
			
 
				+			box_out.ppoint[4] = pts[2].x;
			
 
				+			box_out.ppoint[5] = pts[2].y;
			
 
				+			box_out.ppoint[6] = pts[3].x;
			
 
				+			box_out.ppoint[7] = pts[3].y;
			
 
				+			box_out.ppoint[8] = pts[4].x;
			
 
				+			box_out.ppoint[9] = pts[4].y;
			
 
				+
			
 
				+			box_out.operate_point[0] = 0.0;
			
 
				+			box_out.operate_point[1] = 0.0;
			
 
				+			box_out.operate_angle = 0.0;
			
 
				+
			
 
				+			box_out.area = 0.0;
			
 
				+			box_out.status = 0;
			
 
				+			result.push_back(box_out);
			
 
				+
			
 
				+
			
 
				+			//// Detection box
			
 
				+			//cv::rectangle(frame, box, color, 2);
			
 
				+
			
 
				+			//// Detection box text
			
 
				+			//std::string classString = detection.className + ' ' + std::to_string(detection.confidence).substr(0, 4);
			
 
				+			//cv::Size textSize = cv::getTextSize(classString, cv::FONT_HERSHEY_DUPLEX, 1, 2, 0);
			
 
				+			//cv::Rect textBox(box.x, box.y - 40, textSize.width + 10, textSize.height + 20);
			
 
				+
			
 
				+			//cv::rectangle(frame, textBox, color, cv::FILLED);
			
 
				+			//cv::putText(frame, classString, cv::Point(box.x + 5, box.y - 10), cv::FONT_HERSHEY_DUPLEX, 1, cv::Scalar(0, 0, 0), 2, 0);
			
 
				+
			
 
				+			//for (auto& pt : pts) {
			
 
				+			//	cv::circle(frame, pt, 3, cv::Scalar(0, 0, 255));
			
 
				+			//}
			
 
				 		}
			
 
				+		// Inference ends here...
			
 
				+
			
 
				+		// This is only for preview purposes
			
 
				+		/*float scale = 0.8;
			
 
				+		cv::resize(frame, frame, cv::Size(frame.cols*scale, frame.rows*scale));
			
 
				+		cv::imshow("Inference", frame);
			
 
				+
			
 
				+		cv::waitKey(-1);*/
			
 
				+		
			
 
				 		if (pInstanceLogger) {
			
 
				 			stringstream buff;
			
 
				-			buff << "detected object: " << n;
			
 
				+			buff << "detected object: " << detections;
			
 
				 			pInstanceLogger->INFO(buff.str());
			
 
				 		}
			
 
				 		return result;
			
--- a/tea_detect.h
+++ b/tea_detect.h
@@ -97,7 +97,8 @@ namespace graft_cv {
 
				 		void SetThreshold(float object_threshold, float nms_threshold);
			
 
				 
			
 
				 	private:
			
 
				-		Inference m_infer;
			
 
				+		Inference* m_pInfer;
			
 
				+		bool m_runWithCuda;
			
 
				 		void generate_anchors();
			
 
				 		int post_process(
			
 
				 			cv::Mat &vec_Mat,
			
--- a/tea_sorter.cpp
+++ b/tea_sorter.cpp
@@ -1679,42 +1679,102 @@ double CTeaSort::singleten_ratio(
 
				 Bbox& box
			
 
				 )
			
 
				 {
			
 
				-	//计算图片中背景的占有率
			
 
				-	//padding
			
 
				-	//扩展box的范围，4个方向全部扩展
			
 
				-	int x1 = box.x1;
			
 
				-	int y1 = box.y1;
			
 
				-	int x2 = box.x2;
			
 
				-	int y2 = box.y2;
			
 
				+	//计算苗的方向，找到抓取的位置
			
 
				+	float x3 = box.ppoint[4];
			
 
				+	float y3 = box.ppoint[5];
			
 
				+	float x5 = box.ppoint[8];
			
 
				+	float y5 = box.ppoint[9];
			
 
				+	double angle = atan2(x5 - x3, y5 - y3);
			
 
				+
			
 
				 	int padding_border = m_cp.offset_grab;
			
 
				-	x1 -= padding_border;
			
 
				+
			
 
				+	float grab_x = x3 + (float)padding_border * sin(angle);
			
 
				+	float grab_y = y3 + (float)padding_border * cos(angle);
			
 
				+
			
 
				+	double singleten_ratio = 0.0;
			
 
				+	if (grab_x < 0 || grab_y <0 || grab_x> m_raw_img.cols - 1 || grab_y >m_raw_img.rows - 1) {
			
 
				+		return singleten_ratio;
			
 
				+	}
			
 
				+
			
 
				+	int x1 = int(grab_x) - padding_border / 2;
			
 
				+	int y1 = int(grab_y) - padding_border / 2;
			
 
				+	int x2 = x1 + padding_border;
			
 
				+	int y2 = y1 + padding_border;
			
 
				+
			
 
				 	x1 = x1 < 0 ? 0 : x1;
			
 
				-	y1 -= padding_border;
			
 
				 	y1 = y1 < 0 ? 0 : y1;
			
 
				-
			
 
				-	x2 += padding_border;
			
 
				 	x2 = x2 < m_raw_img.cols ? x2 : m_raw_img.cols - 1;
			
 
				-
			
 
				-	y2 += padding_border;
			
 
				 	y2 = y2 < m_raw_img.rows ? y2 : m_raw_img.rows - 1;
			
 
				-	
			
 
				-	cv::Rect r(x1,y1,x2-x1,y2-y1);
			
 
				-	
			
 
				+
			
 
				+	cv::Rect r(x1, y1, x2 - x1, y2 - y1);
			
 
				+
			
 
				+	//debug
			
 
				+	if (m_cp.image_show) {
			
 
				+		cv::Mat tmp = m_raw_img.clone();
			
 
				+		cv::Rect br(box.x1, box.y1, box.x2 - box.x1, box.y2 - box.y1);
			
 
				+		cv::rectangle(tmp, br, cv::Scalar(0, 0, 200), 2);
			
 
				+		cv::rectangle(tmp, r, cv::Scalar(0, 100, 0), 2);
			
 
				+		imshow_wait("box", tmp);
			
 
				+	}
			
 
				+
			
 
				 	cv::Mat roi = m_raw_gray_img(r).clone();
			
 
				 	cv::Mat bin_img;
			
 
				 	double th = cv::threshold(roi, bin_img, 255, 255, cv::THRESH_OTSU);
			
 
				-	
			
 
				+
			
 
				+	if (m_cp.image_show) {
			
 
				+		imshow_wait("box bin_img", bin_img);
			
 
				+	}
			
 
				+
			
 
				+
			
 
				 	//统计bin_img中非0个数
			
 
				 	double bg_area = 0;
			
 
				 	cv::Mat_<uchar>::iterator it = bin_img.begin<uchar>();
			
 
				 	cv::Mat_<uchar>::iterator it_end = bin_img.end<uchar>();
			
 
				-	for(;it!=it_end;++it){
			
 
				-		if((*it)>0){
			
 
				-			bg_area+=1;
			
 
				+	for (; it != it_end; ++it) {
			
 
				+		if ((*it)>0) {
			
 
				+			bg_area += 1;
			
 
				 		}
			
 
				 	}
			
 
				-	double singleten_ratio = bg_area / static_cast<double>(roi.cols * roi.rows);
			
 
				-	return singleten_ratio;	
			
 
				+	singleten_ratio = bg_area / static_cast<double>(roi.cols * roi.rows);
			
 
				+	return singleten_ratio;
			
 
				+
			
 
				+
			
 
				+	////计算图片中背景的占有率
			
 
				+	////padding
			
 
				+	////扩展box的范围，4个方向全部扩展
			
 
				+	//int x1 = box.x1;
			
 
				+	//int y1 = box.y1;
			
 
				+	//int x2 = box.x2;
			
 
				+	//int y2 = box.y2;
			
 
				+	//int padding_border = m_cp.offset_grab;
			
 
				+	//x1 -= padding_border;
			
 
				+	//x1 = x1 < 0 ? 0 : x1;
			
 
				+	//y1 -= padding_border;
			
 
				+	//y1 = y1 < 0 ? 0 : y1;
			
 
				+
			
 
				+	//x2 += padding_border;
			
 
				+	//x2 = x2 < m_raw_img.cols ? x2 : m_raw_img.cols - 1;
			
 
				+
			
 
				+	//y2 += padding_border;
			
 
				+	//y2 = y2 < m_raw_img.rows ? y2 : m_raw_img.rows - 1;
			
 
				+	//
			
 
				+	//cv::Rect r(x1,y1,x2-x1,y2-y1);
			
 
				+	//
			
 
				+	//cv::Mat roi = m_raw_gray_img(r).clone();
			
 
				+	//cv::Mat bin_img;
			
 
				+	//double th = cv::threshold(roi, bin_img, 255, 255, cv::THRESH_OTSU);
			
 
				+	//
			
 
				+	////统计bin_img中非0个数
			
 
				+	//double bg_area = 0;
			
 
				+	//cv::Mat_<uchar>::iterator it = bin_img.begin<uchar>();
			
 
				+	//cv::Mat_<uchar>::iterator it_end = bin_img.end<uchar>();
			
 
				+	//for(;it!=it_end;++it){
			
 
				+	//	if((*it)>0){
			
 
				+	//		bg_area+=1;
			
 
				+	//	}
			
 
				+	//}
			
 
				+	//double singleten_ratio = bg_area / static_cast<double>(roi.cols * roi.rows);
			
 
				+	//return singleten_ratio;	
			
 
				 }
			
 
				 double CTeaSort::direction_ratio(
			
 
				 	Bbox& box