OpenVINO asynchronous C++ example
CMakeLists.txt
cmake_minimum_required(VERSION 3.4.3)
project(sample CXX)

find_package(InferenceEngine REQUIRED)

add_executable(${CMAKE_PROJECT_NAME} main.cpp)
target_compile_features(${CMAKE_PROJECT_NAME} PRIVATE cxx_range_for)
target_link_libraries(${CMAKE_PROJECT_NAME}
    ${InferenceEngine_LIBRARIES}
    pthread
)
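Note: this project file targets the classic Inference Engine API. For find_package(InferenceEngine) to succeed, the OpenVINO environment typically has to be initialized first, for example by sourcing the toolkit's setupvars script before running CMake.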
main.cpp
#include <queue>
#include <mutex>
#include <thread>
#include <condition_variable>
#include <chrono>
#include <vector>
#include <string>
#include <map>
#include <iostream>
#include <sys/time.h>
#include <inference_engine.hpp>

using namespace InferenceEngine;
class OpenVINOLauncher {
public:
    OpenVINOLauncher(const std::string& xmlPath, const std::string& device);

    // Request data to be processed.
    void process(const std::vector<float>& data);

    // Wait for a ready prediction. Order is preserved.
    void get(std::vector<float>& prediction);

    unsigned int nireq;

private:
    Core ie;
    std::string outputName;
    ExecutableNetwork execNet;
    std::queue<InferRequest::Ptr> requests;
    std::queue<InferRequest::Ptr> idleRequests;
    std::queue<std::vector<float> > predictions;
    std::mutex predictionsMutex;
    std::condition_variable prediction_ready;
    std::thread worker;
};
int main(int argc, char** argv) {
    if (argc < 3) {
        std::cerr << "Usage: " << argv[0] << " <model.xml> <device>" << std::endl;
        return 1;
    }
    const int num = 100;
    OpenVINOLauncher launcher(argv[1], argv[2]);

    // This thread imitates an input data source.
    std::thread dataThread([&](){
        std::vector<float> inputData(1 * 3 * 224 * 224);
        for (int i = 0; i < num; ++i) {
            launcher.process(inputData);
            std::this_thread::sleep_for(std::chrono::milliseconds(1));
        }
    });

    // Retrieve predictions and measure throughput.
    timeval start, end;
    gettimeofday(&start, 0);
    std::vector<float> prediction;
    // TODO: process last <nireq> predictions
    for (int i = 0; i < num - launcher.nireq; ++i) {
        launcher.get(prediction);
    }
    gettimeofday(&end, 0);
    std::cout << "FPS: " << num / ((end.tv_sec - start.tv_sec) +
                                   (end.tv_usec - start.tv_usec) * 1e-6) << std::endl;

    dataThread.join();
    return 0;
}
OpenVINOLauncher::OpenVINOLauncher(const std::string& xmlPath, const std::string& device) {
    CNNNetwork net = ie.ReadNetwork(xmlPath);

    // Enable throughput mode so that multiple infer requests run in parallel.
    std::map<std::string, std::string> config;
    if (device.find("CPU") != std::string::npos) {
        config["CPU_THROUGHPUT_STREAMS"] = "CPU_THROUGHPUT_AUTO";
    }
    if (device.find("GPU") != std::string::npos) {
        config["GPU_THROUGHPUT_STREAMS"] = "GPU_THROUGHPUT_AUTO";
    }
    execNet = ie.LoadNetwork(net, device, config);

    // Query the optimal number of parallel infer requests for this device.
    nireq = execNet.GetMetric(METRIC_KEY(OPTIMAL_NUMBER_OF_INFER_REQUESTS)).as<unsigned int>();
    outputName = net.getOutputsInfo().begin()->first;
    std::cout << "Inference requests: " << nireq << std::endl;

    for (unsigned int i = 0; i < nireq; ++i) {
        idleRequests.push(execNet.CreateInferRequestPtr());
    }
}
void OpenVINOLauncher::process(const std::vector<float>& input) {
    // If there is no idle request to handle the new input, wait for the
    // oldest in-flight request to finish.
    if (idleRequests.empty())
        requests.front()->Wait(IInferRequest::RESULT_READY);

    // Collect outputs from the requests at the front of the queue that have
    // already finished and return them to the idle pool.
    while (!requests.empty()) {
        auto req = requests.front();
        if (req->Wait(IInferRequest::STATUS_ONLY) != StatusCode::OK)  // not ready yet
            break;
        Blob::Ptr out = req->GetBlob(outputName);
        float* data = out->buffer();
        std::unique_lock<std::mutex> lock(predictionsMutex);
        predictions.push(std::vector<float>(data, data + out->size()));
        prediction_ready.notify_one();
        requests.pop();
        idleRequests.push(req);
    }

    // Start a new asynchronous request. Note: the input blob name "input_1"
    // and the 1x3x224x224 NCHW shape are model specific.
    auto req = idleRequests.front();
    float* data = const_cast<float*>(input.data());
    Blob::Ptr inputBlob = make_shared_blob<float>(TensorDesc(Precision::FP32, {1, 3, 224, 224}, Layout::NCHW), data);
    req->SetBlob("input_1", inputBlob);
    req->StartAsync();
    idleRequests.pop();
    requests.push(req);
}
void OpenVINOLauncher::get(std::vector<float>& prediction) {
    std::unique_lock<std::mutex> lock(predictionsMutex);
    prediction_ready.wait(lock, [&]{ return !predictions.empty(); });
    prediction = predictions.front();
    predictions.pop();
}
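The program expects the path to an IR .xml model and the target device on the command line, e.g. ./sample model.xml CPU (the binary name comes from project(sample); model.xml here is just a placeholder for your own model file).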
// TODO: process last <nireq> predictions
for (int i = 0; i < num - launcher.nireq; ++i) {
    launcher.get(prediction);
}
Why not: for (int i = 0; i < num; ++i)?
Thanks!
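The loop stops at num - launcher.nireq because, once the data thread has submitted its last input, up to nireq requests are still in flight and nothing pushes their outputs into the predictions queue anymore (outputs are only published from inside process()); iterating up to num would therefore block in get(). One way to complete the TODO is a flush() method, sketched below; it is not part of the original gist and assumes it is declared alongside process() and get() in OpenVINOLauncher:

// Hypothetical helper (not in the original gist): wait for every request that
// is still in flight and publish its output, so that all <num> predictions
// can eventually be retrieved.
void OpenVINOLauncher::flush() {
    while (!requests.empty()) {
        auto req = requests.front();
        req->Wait(IInferRequest::RESULT_READY);  // block until this request finishes
        Blob::Ptr out = req->GetBlob(outputName);
        float* data = out->buffer();
        {
            std::unique_lock<std::mutex> lock(predictionsMutex);
            predictions.push(std::vector<float>(data, data + out->size()));
        }
        prediction_ready.notify_one();
        requests.pop();
        idleRequests.push(req);
    }
}

// In main(), the tail could then be drained after the data source finishes:
//     dataThread.join();
//     launcher.flush();
//     for (unsigned int i = 0; i < launcher.nireq; ++i)
//         launcher.get(prediction);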