Add files via upload

hpc203 · web-flow · commit f29da2f0bdff · 2023-07-30T18:10:07.000+08:00
diff --git a/input.png b/input.png
diff --git a/main.cpp b/main.cpp
@@ -0,0 +1,150 @@
+#define _CRT_SECURE_NO_WARNINGS
+#include <array>
+#include <fstream>
+#include <iostream>
+#include <numeric>
+#include <stdexcept>
+#include <string>
+#include <vector>
+#include <opencv2/imgproc.hpp>
+#include <opencv2/highgui.hpp>
+//#include <cuda_provider_factory.h>  ///nvidia-cuda acceleration
+#include <onnxruntime_cxx_api.h>
+
+using namespace cv;
+using namespace std;
+using namespace Ort;
+
+/// Wrapper around an ONNX Runtime session for a CodeFormer model.
+///
+/// The constructor loads the model and records its input/output names and
+/// shapes; detect() runs one image through the network and returns the result
+/// as an 8-bit, 3-channel Mat.
+class CodeFormer
+{
+public:
+	CodeFormer(string modelpath);
+
+	/// Releases the session and the name strings the constructor obtained from
+	/// the ONNX Runtime allocator; nothing else frees them.
+	~CodeFormer()
+	{
+		AllocatorWithDefaultOptions allocator;
+		for (char* name : input_names) allocator.Free(name);
+		for (char* name : output_names) allocator.Free(name);
+		delete ort_session;
+	}
+
+	// ort_session is an owning raw pointer, so a copied object would delete the
+	// same session twice. Copying is therefore disabled.
+	CodeFormer(const CodeFormer&) = delete;
+	CodeFormer& operator=(const CodeFormer&) = delete;
+
+	/// Runs the model on cv_image and returns the restored image.
+	Mat detect(Mat cv_image);
+private:
+	/// Fills input_image_ from srcimg (colour conversion, resize, normalisation).
+	void preprocess(Mat srcimg);
+	vector<float> input_image_;   // planar float buffer handed to the first model input
+	vector<double> input2_tensor; // data for the second model input; the constructor stores a single 0.5
+	int inpWidth = 0;   // read from dim 3 of the first input
+	int inpHeight = 0;  // read from dim 2 of the first input
+	int outWidth = 0;   // read from dim 3 of the first output
+	int outHeight = 0;  // read from dim 2 of the first output
+	
+	float min_max[2] = { -1,1 }; // value range detect() clips the output to before rescaling to 0..255
+
+	// ONNX Runtime state created once in the constructor and reused by detect()
+	Env env = Env(ORT_LOGGING_LEVEL_ERROR, "CodeFormer");
+	Ort::Session *ort_session = nullptr;
+	SessionOptions sessionOptions = SessionOptions();
+	vector<char*> input_names;
+	vector<char*> output_names;
+	vector<vector<int64_t>> input_node_dims; // one shape per model input
+	vector<vector<int64_t>> output_node_dims; // one shape per model output
+};
+
+CodeFormer::CodeFormer(string model_path)
+{
+	//OrtStatus* status = OrtSessionOptionsAppendExecutionProvider_CUDA(sessionOptions, 0);  ///nvidia-cuda����
+	sessionOptions.SetGraphOptimizationLevel(ORT_ENABLE_BASIC);
+	std::wstring widestr = std::wstring(model_path.begin(), model_path.end());   ///�����windowsϵͳ����ôд
+	ort_session = new Session(env, widestr.c_str(), sessionOptions);   ///�����windowsϵͳ����ôд
+	///ort_session = new Session(env, model_path.c_str(), sessionOptions);  ///�����linuxϵͳ������ôд
+
+	size_t numInputNodes = ort_session->GetInputCount();
+	size_t numOutputNodes = ort_session->GetOutputCount();
+	AllocatorWithDefaultOptions allocator;
+	for (int i = 0; i < numInputNodes; i++)
+	{
+		input_names.push_back(ort_session->GetInputName(i, allocator));
+		Ort::TypeInfo input_type_info = ort_session->GetInputTypeInfo(i);
+		auto input_tensor_info = input_type_info.GetTensorTypeAndShapeInfo();
+		auto input_dims = input_tensor_info.GetShape();
+		input_node_dims.push_back(input_dims);
+	}
+	for (int i = 0; i < numOutputNodes; i++)
+	{
+		output_names.push_back(ort_session->GetOutputName(i, allocator));
+		Ort::TypeInfo output_type_info = ort_session->GetOutputTypeInfo(i);
+		auto output_tensor_info = output_type_info.GetTensorTypeAndShapeInfo();
+		auto output_dims = output_tensor_info.GetShape();
+		output_node_dims.push_back(output_dims);
+	}
+
+	this->inpHeight = input_node_dims[0][2];
+	this->inpWidth = input_node_dims[0][3];
+	this->outHeight = output_node_dims[0][2];
+	this->outWidth = output_node_dims[0][3];
+	input2_tensor.push_back(0.5);
+}
+
+/// Converts srcimg into the float buffer fed to the first model input.
+///
+/// The image is converted BGR -> RGB, resized to inpWidth x inpHeight, and
+/// written into input_image_ plane by plane (all of channel 0, then 1, then 2),
+/// with each 8-bit value v mapped to (v / 255 - 0.5) / 0.5.
+void CodeFormer::preprocess(Mat srcimg)
+{
+	Mat rgb;
+	cvtColor(srcimg, rgb, COLOR_BGR2RGB);
+	// fx/fy are passed as 0 so that INTER_LINEAR lands in the interpolation
+	// parameter rather than in the fx scale factor.
+	resize(rgb, rgb, Size(this->inpWidth, this->inpHeight), 0, 0, INTER_LINEAR);
+
+	const int rows = this->inpHeight;
+	const int cols = this->inpWidth;
+	this->input_image_.resize(cols * rows * rgb.channels());
+
+	for (int c = 0; c < 3; c++)
+	{
+		for (int y = 0; y < rows; y++)
+		{
+			const uchar* src_row = rgb.ptr<uchar>(y);
+			float* dst_row = this->input_image_.data() + (c * rows + y) * cols;
+			for (int x = 0; x < cols; x++)
+			{
+				// Interleaved source pixel -> planar destination.
+				const float pix = src_row[x * 3 + c];
+				dst_row[x] = static_cast<float>((pix / 255.0 - 0.5) / 0.5);
+			}
+		}
+	}
+}
+
+/// Runs the model on one image and returns the restored result.
+///
+/// @param srcimg  Input image; preprocess() converts it from BGR and resizes it
+///                to the network input size.
+/// @return 8-bit 3-channel image at the network's output resolution. It is not
+///         resized back to the size of srcimg.
+/// @throws std::runtime_error if the first output is not an N x 3 x H x W tensor.
+Mat CodeFormer::detect(Mat srcimg)
+{
+	this->preprocess(srcimg);
+	std::array<int64_t, 4> input_shape_{ 1, 3, this->inpHeight, this->inpWidth };
+	vector<int64_t> input2_shape_ = { 1 };
+
+	auto allocator_info = MemoryInfo::CreateCpu(OrtDeviceAllocator, OrtMemTypeCPU);
+	vector<Value> ort_inputs;
+	ort_inputs.push_back(Value::CreateTensor<float>(allocator_info, input_image_.data(), input_image_.size(), input_shape_.data(), input_shape_.size()));
+	ort_inputs.push_back(Value::CreateTensor<double>(allocator_info, input2_tensor.data(), input2_tensor.size(), input2_shape_.data(), input2_shape_.size()));
+	vector<Value> ort_outputs = ort_session->Run(RunOptions{ nullptr }, input_names.data(), ort_inputs.data(), ort_inputs.size(), output_names.data(), output_names.size());
+
+	////post_process
+	// Take the output size from the returned tensor rather than from the
+	// metadata cached in the constructor, and check it before wrapping the raw
+	// buffer in Mat headers below.
+	if (ort_outputs.empty())
+	{
+		throw std::runtime_error("CodeFormer: model produced no output");
+	}
+	const vector<int64_t> out_shape = ort_outputs[0].GetTensorTypeAndShapeInfo().GetShape();
+	if (out_shape.size() != 4 || out_shape[0] < 1 || out_shape[1] != 3 || out_shape[2] <= 0 || out_shape[3] <= 0)
+	{
+		throw std::runtime_error("CodeFormer: unexpected output tensor shape");
+	}
+	const int out_h = static_cast<int>(out_shape[2]);
+	const int out_w = static_cast<int>(out_shape[3]);
+
+	float* pred = ort_outputs[0].GetTensorMutableData<float>();
+	// One CV_32FC3 header over pred would be wrong: the three channels are
+	// stored as consecutive planes, while Mat expects interleaved channels.
+	const size_t channel_step = static_cast<size_t>(out_h) * out_w;
+	vector<Mat> channel_mats;
+	channel_mats.push_back(Mat(out_h, out_w, CV_32FC1, pred)); // R
+	channel_mats.push_back(Mat(out_h, out_w, CV_32FC1, pred + channel_step)); // G
+	channel_mats.push_back(Mat(out_h, out_w, CV_32FC1, pred + 2 * channel_step)); // B
+	Mat mask;
+	merge(channel_mats, mask); // CV_32FC3 allocated
+
+	// Clip to [min_max[0], min_max[1]] without a per-pixel loop (the numpy.clip
+	// equivalent used in main.py).
+	mask.setTo(this->min_max[0], mask < this->min_max[0]);
+	mask.setTo(this->min_max[1], mask > this->min_max[1]);
+
+	// Rescale the clipped range to 0..255 and convert to 8-bit.
+	mask = (mask - this->min_max[0]) / (this->min_max[1] - this->min_max[0]);
+	mask *= 255.0;
+	mask.convertTo(mask, CV_8UC3);
+	// Planes were merged as R, G, B; swap to OpenCV's BGR order.
+	cvtColor(mask, mask, COLOR_RGB2BGR);
+	return mask;
+}
+
+/// Restores input.png with codeformer.onnx and shows the source and the
+/// restored image in two windows.
+///
+/// @return 0 on success, 1 if the image cannot be read or the model fails.
+int main()
+{
+	const string imgpath = "input.png";
+	Mat srcimg = imread(imgpath);
+	if (srcimg.empty())
+	{
+		// imread signals failure by returning an empty Mat, not by throwing.
+		cerr << "Failed to read image: " << imgpath << endl;
+		return 1;
+	}
+
+	Mat dstimg;
+	try
+	{
+		CodeFormer mynet("codeformer.onnx");
+		dstimg = mynet.detect(srcimg);
+	}
+	catch (const std::exception& e)
+	{
+		// Report model loading and inference errors instead of terminating
+		// on an unhandled exception.
+		cerr << "CodeFormer failed: " << e.what() << endl;
+		return 1;
+	}
+	// Bring the result back to the source resolution. fx/fy are 0 so that
+	// INTER_LINEAR is taken as the interpolation flag.
+	resize(dstimg, dstimg, Size(srcimg.cols, srcimg.rows), 0, 0, INTER_LINEAR);
+	
+	//imwrite("result.jpg", dstimg)
+	namedWindow("srcimg", WINDOW_NORMAL);
+	imshow("srcimg", srcimg);
+	namedWindow("dstimg", WINDOW_NORMAL);
+	imshow("dstimg", dstimg);
+	waitKey(0);
+	destroyAllWindows();
+	return 0;
+}
diff --git a/main.py b/main.py
@@ -0,0 +1,80 @@
+import argparse
+import cv2
+import numpy as np
+import onnxruntime as ort
+
+
+class CodeFormer():
+    def __init__(self, modelpath):
+        # net = cv2.dnn.readNet(modelpath)
+        so = ort.SessionOptions()
+        so.log_severity_level = 3
+        self.session = ort.InferenceSession(modelpath, so)
+        model_inputs = self.session.get_inputs()
+        self.input_name0 = model_inputs[0].name
+        self.input_name1 = model_inputs[1].name
+        self.inpheight = model_inputs[0].shape[2]
+        self.inpwidth = model_inputs[0].shape[3]
+
+    def post_processing(self, tensor, rgb2bgr=True, out_type=np.uint8, min_max=(0, 1)):
+        # tensor 3ch
+        _tensor = tensor[0]
+
+        _tensor = _tensor.clip(min_max[0], min_max[1])
+
+        _tensor = (_tensor - min_max[0]) / (min_max[1] - min_max[0])
+
+        n_dim = _tensor.ndim
+
+        if n_dim == 3:
+            img_np = _tensor
+            img_np = img_np.transpose(1, 2, 0)
+            if img_np.shape[2] == 1:  # gray image
+                img_np = np.squeeze(img_np, axis=2)
+            else:
+                if rgb2bgr:
+                    img_np = cv2.cvtColor(img_np, cv2.COLOR_RGB2BGR)
+        elif n_dim == 2:
+            img_np = _tensor
+        else:
+            raise TypeError('Only support 4D, 3D or 2D tensor. ' f'But received with dimension: {n_dim}')
+        if out_type == np.uint8:
+            # Unlike MATLAB, numpy.unit8() WILL NOT round by default.
+            img_np = (img_np * 255.0).round()
+        img_np = img_np.astype(out_type)
+        return img_np
+
+    def detect(self, srcimg):
+        dstimg = cv2.cvtColor(srcimg, cv2.COLOR_BGR2RGB)
+        dstimg = cv2.resize(dstimg, (self.inpwidth, self.inpheight), interpolation=cv2.INTER_LINEAR)
+        dstimg = (dstimg.astype(np.float32)/255.0 - 0.5) / 0.5
+        input_image = np.expand_dims(dstimg.transpose(2, 0, 1), axis=0).astype(np.float32)
+
+        # Inference
+        output = self.session.run(None, {self.input_name0: input_image, self.input_name1:np.array([0.5])})[0]
+        restored_img = self.post_processing(output, rgb2bgr=True, min_max=(-1, 1))
+        return restored_img.astype('uint8')
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--imgpath", type=str, default='input.png', help="image path")
+    parser.add_argument("--modelpath", type=str, default='codeformer.onnx', help="onnxmodel path")
+    args = parser.parse_args()
+
+    mynet = CodeFormer(args.modelpath)
+    srcimg = cv2.imread(args.imgpath)
+    restored_img = mynet.detect(srcimg)
+    restored_img = cv2.resize(restored_img, (srcimg.shape[1], srcimg.shape[0]), interpolation=cv2.INTER_LINEAR)
+
+    # if srcimg.shape[0]>=srcimg.shape[1]:
+    #     result = np.vstack((srcimg, restored_img))
+    # else:
+    #     result = np.hstack((srcimg, restored_img))
+
+    # cv2.imwrite('result.jpg', restored_img)
+    cv2.namedWindow("srcimg", cv2.WINDOW_NORMAL)
+    cv2.imshow("srcimg", srcimg)
+    cv2.namedWindow("restored_img", cv2.WINDOW_NORMAL)
+    cv2.imshow("restored_img", restored_img)
+    cv2.waitKey(0)
+    cv2.destroyAllWindows()