hpc203
diff --git a/‎images/DSC_0410.JPG
382 KB b/‎images/DSC_0410.JPG
382 KB
diff --git a/‎images/DSC_0411.JPG
411 KB b/‎images/DSC_0411.JPG
411 KB
diff --git a/‎images/a.jpg
172 KB b/‎images/a.jpg
172 KB
diff --git a/‎images/b.jpg
209 KB b/‎images/b.jpg
209 KB
diff --git a/‎images/im_A.jpg
282 KB b/‎images/im_A.jpg
282 KB
diff --git a/‎images/im_B.jpg
1.08 MB b/‎images/im_B.jpg
1.08 MB
diff --git a/‎main.cpp
Lines changed: 162 additions & 0 deletions b/‎main.cpp
Lines changed: 162 additions & 0 deletions
diff --git a/‎main.py
Lines changed: 59 additions & 0 deletions b/‎main.py
Lines changed: 59 additions & 0 deletions
@@ -0,0 +1,162 @@
+#define _CRT_SECURE_NO_WARNINGS
+#include <iostream>
+#include <fstream>
+#include <string>
+
+#include <opencv2/imgproc.hpp>
+#include <opencv2/highgui.hpp>
+#include <opencv2/opencv.hpp> 
+#include <opencv2/features2d.hpp>
+
+//#include <cuda_provider_factory.h>
+#include <onnxruntime_cxx_api.h>
+
+using namespace cv;
+using namespace std;
+using namespace Ort;
+
+
+/// Wraps an ONNX Runtime session for an end-to-end model that takes a pair of
+/// images and produces keypoint coordinates for both of them.
+class DeDoDeRunner_end2end
+{
+public:
+	/// Creates the ONNX Runtime session for the model file at model_path and
+	/// records the model's input/output names and output shapes.
+	DeDoDeRunner_end2end(string model_path);
+	/// Frees the session allocated by the constructor (previously it was never released).
+	~DeDoDeRunner_end2end() { delete ort_session; }
+	// The raw session pointer has exactly one owner, so copying is disabled
+	// to rule out a double delete.
+	DeDoDeRunner_end2end(const DeDoDeRunner_end2end&) = delete;
+	DeDoDeRunner_end2end& operator=(const DeDoDeRunner_end2end&) = delete;
+	/// Runs the model on image_a / image_b and fills points_A / points_B with
+	/// keypoints expressed in the pixel coordinates of the respective image.
+	void detect(Mat image_a, Mat image_b, vector<cv::KeyPoint>& points_A, vector<cv::KeyPoint>& points_B);
+private:
+	const int inpWidth = 256;   // width the images are resized to before inference
+	const int inpHeight = 256;  // height the images are resized to before inference
+	const float mean_[3] = { 0.485, 0.456, 0.406 };  // per-channel mean subtracted in preprocess()
+	const float std_[3] = { 0.229, 0.224, 0.225 };   // per-channel divisor applied in preprocess()
+	vector<float> input_images;  // planar float buffer holding both preprocessed images
+	/// Fills input_images with the normalized, resized RGB planes of both images.
+	void preprocess(Mat image_a, Mat image_b);
+
+	Env env = Env(ORT_LOGGING_LEVEL_ERROR, "cv::KeyPoints detect and match");
+	Ort::Session* ort_session = nullptr;  // owned; released in the destructor
+	SessionOptions sessionOptions = SessionOptions();
+	vector<char*> input_names;
+	vector<char*> output_names;
+	vector<vector<int64_t>> output_node_dims; // >=1 outputs
+};
+
+/// Builds the inference session for the model at model_path and caches the
+/// names of its inputs/outputs together with the declared output shapes.
+DeDoDeRunner_end2end::DeDoDeRunner_end2end(string model_path)
+{
+	// Ort::Session takes the path as ORTCHAR_T characters (wchar_t on Windows,
+	// char elsewhere). Building the string from ORTCHAR_T keeps this portable
+	// instead of hard-coding std::wstring. Characters are converted one by one,
+	// so no multi-byte decoding of the path takes place.
+	const std::basic_string<ORTCHAR_T> ort_model_path(model_path.begin(), model_path.end());
+	//OrtStatus* status = OrtSessionOptionsAppendExecutionProvider_CUDA(sessionOptions, 0);
+	sessionOptions.SetGraphOptimizationLevel(ORT_ENABLE_BASIC);
+	ort_session = new Session(env, ort_model_path.c_str(), sessionOptions);
+
+	const size_t numInputNodes = ort_session->GetInputCount();
+	const size_t numOutputNodes = ort_session->GetOutputCount();
+	AllocatorWithDefaultOptions allocator;
+
+	input_names.reserve(numInputNodes);
+	for (size_t i = 0; i < numInputNodes; i++)
+	{
+		input_names.push_back(ort_session->GetInputName(i, allocator));
+	}
+
+	output_names.reserve(numOutputNodes);
+	output_node_dims.reserve(numOutputNodes);
+	for (size_t i = 0; i < numOutputNodes; i++)
+	{
+		output_names.push_back(ort_session->GetOutputName(i, allocator));
+		// Keep the shape the model declares for this output.
+		Ort::TypeInfo output_type_info = ort_session->GetOutputTypeInfo(i);
+		auto output_tensor_info = output_type_info.GetTensorTypeAndShapeInfo();
+		output_node_dims.push_back(output_tensor_info.GetShape());
+	}
+}
+
+/// Converts both BGR images to RGB, resizes them to inpWidth x inpHeight and
+/// writes them, normalized with mean_/std_, into input_images in planar order:
+/// the three channel planes of image_a followed by the three planes of image_b.
+void DeDoDeRunner_end2end::preprocess(Mat image_a, Mat image_b)
+{
+	const Size target_size(this->inpWidth, this->inpHeight);
+	const int plane_size = target_size.area();
+	this->input_images.resize(static_cast<size_t>(2) * plane_size * 3);
+
+	// Writes the three normalized channel planes of one image, starting at
+	// plane index first_plane (0 for image_a, 3 for image_b).
+	const auto fill_planes = [&](const Mat& image, int first_plane)
+	{
+		Mat rgb;
+		cvtColor(image, rgb, COLOR_BGR2RGB);
+		// The interpolation flag is the 6th argument of cv::resize; the 4th and
+		// 5th are the fx/fy scale factors, which are unused when dsize is given.
+		resize(rgb, rgb, target_size, 0, 0, INTER_LINEAR);
+		for (int c = 0; c < 3; c++)
+		{
+			float* plane = this->input_images.data() + static_cast<size_t>(first_plane + c) * plane_size;
+			for (int i = 0; i < this->inpHeight; i++)
+			{
+				const uchar* row = rgb.ptr<uchar>(i);
+				for (int j = 0; j < this->inpWidth; j++)
+				{
+					const float pix = row[j * 3 + c];
+					plane[i * this->inpWidth + j] = (pix / 255.0 - this->mean_[c]) / this->std_[c];
+				}
+			}
+		}
+	};
+
+	fill_planes(image_a, 0);
+	fill_planes(image_b, 3);
+}
+
+
+/// Runs the model on the image pair and converts its first two outputs into
+/// keypoints. The coordinates read from the outputs are mapped with
+/// (v + 1) * 0.5 * extent, using the column/row count of the matching source image.
+/// points_A and points_B are overwritten; every keypoint gets size 1.
+void DeDoDeRunner_end2end::detect(Mat image_a, Mat image_b, vector<cv::KeyPoint>& points_A, vector<cv::KeyPoint>& points_B)
+{
+	this->preprocess(image_a, image_b);
+	array<int64_t, 4> input_shape_{ 2, 3, this->inpHeight, this->inpWidth };
+
+	auto allocator_info = MemoryInfo::CreateCpu(OrtDeviceAllocator, OrtMemTypeCPU);
+	Value input_tensor_ = Value::CreateTensor<float>(allocator_info, input_images.data(), input_images.size(), input_shape_.data(), input_shape_.size());
+
+	// Run inference
+	vector<Value> ort_outputs = ort_session->Run(RunOptions{ nullptr }, &input_names[0], &input_tensor_, 1, output_names.data(), output_names.size());
+	// Outputs 0 and 1 are both read below; fail loudly instead of indexing out of range.
+	CV_Assert(ort_outputs.size() >= 2);
+
+	// Postprocessing: turns one output tensor of (x, y) pairs into keypoints
+	// scaled to the given image.
+	const auto to_keypoints = [](Value& tensor, const Mat& image, vector<cv::KeyPoint>& points)
+	{
+		const float* coords = tensor.GetTensorMutableData<float>();
+		const int64_t num_points = tensor.GetTensorTypeAndShapeInfo().GetShape()[0];
+		// assign() resets every element, so fields of keypoints left over from
+		// a previous call (angle, response, ...) cannot leak into the result.
+		points.assign(static_cast<size_t>(num_points), cv::KeyPoint());
+		for (int64_t i = 0; i < num_points; i++)
+		{
+			points[i].pt.x = (coords[i * 2] + 1) * 0.5 * image.cols;
+			points[i].pt.y = (coords[i * 2 + 1] + 1) * 0.5 * image.rows;
+			points[i].size = 1.f;
+		}
+	};
+
+	to_keypoints(ort_outputs[0], image_a, points_A);
+	to_keypoints(ort_outputs[1], image_b, points_B);
+}
+
+/// Loads the model and two sample images, runs detection/matching and shows
+/// the matches in a window. Returns 1 when an input image cannot be read.
+int main()
+{
+	DeDoDeRunner_end2end mynet("weights/dedode_end2end_1024.onnx");
+	string imgpath_a = "images/im_A.jpg";
+	string imgpath_b = "images/im_B.jpg";
+	Mat image_a = imread(imgpath_a);
+	Mat image_b = imread(imgpath_b);
+	// imread signals failure with an empty matrix rather than an exception.
+	if (image_a.empty() || image_b.empty())
+	{
+		cerr << "Failed to read input image: " << (image_a.empty() ? imgpath_a : imgpath_b) << endl;
+		return 1;
+	}
+
+	vector<cv::KeyPoint> points_A;
+	vector<cv::KeyPoint> points_B;
+	mynet.detect(image_a, image_b, points_A, points_B);
+
+	// Store the matching result in matches: keypoint i of A is paired with
+	// keypoint i of B. The count is bounded by the shorter list so that no
+	// DMatch can reference a keypoint that does not exist.
+	const size_t smaller_count = points_A.size() < points_B.size() ? points_A.size() : points_B.size();
+	const int num_points = static_cast<int>(smaller_count);
+	vector<DMatch> matches(num_points);
+	for (int i = 0; i < num_points; i++)
+	{
+		matches[i] = DMatch(i, i, 0.f);
+	}
+
+	// Draw both images with their match relations; the canvas is match_img.
+	Mat match_img;
+	drawMatches(image_a, points_A, image_b, points_B, matches, match_img);
+
+	//-- Show detected matches
+	static const string kWinName = "Image Matches in ONNXRuntime";
+	namedWindow(kWinName, WINDOW_NORMAL);
+	imshow(kWinName, match_img);
+	waitKey(0);
+	destroyAllWindows();
+	return 0;
+}
@@ -0,0 +1,59 @@
+import numpy as np
+import onnxruntime as ort
+import cv2
+
+class DeDoDeRunner_end2end:
+    def __init__(self, end2end_path, img_size=[256, 256], fp16=False, providers=["CUDAExecutionProvider", "CPUExecutionProvider"]):
+        self.end2end = ort.InferenceSession(end2end_path, providers=providers)
+        self.mean_ = np.array([0.485, 0.456, 0.406], dtype=np.float32).reshape((1,1,3))
+        self.std_ = np.array([0.229, 0.224, 0.225], dtype=np.float32).reshape((1,1,3))
+        self.H, self.W = img_size
+        self.fp16 = fp16
+
+    def preprocess(self, image_a, image_b):
+        images = np.stack([cv2.resize(image_a, (self.W, self.H)), cv2.resize(image_b, (self.W, self.H))])
+        images = (images / 255.0 - self.mean_) / self.std_
+        return images.transpose(0, 3, 1, 2).astype(np.float32)
+
+    def detect(self, image_a, image_b):
+        H_A, W_A = image_a.shape[:2]
+        H_B, W_B = image_b.shape[:2]
+        images = self.preprocess(cv2.cvtColor(image_a, cv2.COLOR_BGR2RGB), cv2.cvtColor(image_b, cv2.COLOR_BGR2RGB))
+        if self.fp16:
+            images = images.astype(np.float16)
+        matches_A, matches_B, batch_ids = self.end2end.run(None, {"images": images})
+
+        # Postprocessing
+        matches_A = self.postprocess(matches_A, H_A, W_A)
+        matches_B = self.postprocess(matches_B, H_B, W_B)
+        return matches_A, matches_B
+
+    def postprocess(self, matches, H, W):
+        return (matches + 1) / 2 * [W, H]
+
+def draw_matches(im_A, kpts_A, im_B, kpts_B):
+    kpts_A = [cv2.KeyPoint(x, y, 1.0) for x, y in kpts_A]
+    kpts_B = [cv2.KeyPoint(x, y, 1.0) for x, y in kpts_B]
+    matches_A_to_B = [cv2.DMatch(idx, idx, 0.0) for idx in range(len(kpts_A))]
+    im_A, im_B = np.array(im_A), np.array(im_B)
+    ret = cv2.drawMatches(im_A, kpts_A, im_B, kpts_B, matches_A_to_B, None)
+    return ret
+
+if __name__ == "__main__":
+    img_paths = ["images/im_A.jpg", "images/im_B.jpg"]
+    mynet = DeDoDeRunner_end2end('weights/dedode_end2end_1024_fp16.onnx', fp16=True)
+
+    image_a, image_b = cv2.imread(img_paths[0]), cv2.imread(img_paths[1])
+    matches_a, matches_b = mynet.detect(image_a, image_b)
+
+    # match_img = np.hstack((image_a, image_b)) ###直接把两幅输入原图拼在一起,然后在点集里从0开始连线，是不行的。因为两幅输入原图的高宽并不是完全相同的，这就使得在两幅图里检测到的点集个数也可能不相等。因此不能直接连线的，要使用DMatch建立两个点集里的点间对应关系
+    # w = image_a.shape[1]
+    # for i in range(matches_a.shape[0]):
+    #     cv2.line(match_img, (int(matches_a[i,0]), int(matches_a[i,1])), (int(w+matches_b[i,0]), int(w+matches_b[i,1])), (0, 255, 0), lineType=16)
+
+    match_img = draw_matches(image_a, matches_a, image_b, matches_b)
+    print('image_a.shape =',image_a.shape, 'image_b.shape =',image_b.shape, 'match_img.shape =',match_img.shape)
+    cv2.namedWindow('Image matches use onnxrunime', cv2.WINDOW_NORMAL)
+    cv2.imshow("Image matches use onnxrunime", match_img)
+    cv2.waitKey(0)
+    cv2.destroyAllWindows()