inference/inference3.h


#ifndef INFERENCE_FRAMEWORK_INFERENCE3_H
#define INFERENCE_FRAMEWORK_INFERENCE3_H

#include "bmutility.h"
#include "thread_queue.h"
namespace bm {
    template<typename T1, typename T2>
    class MediaDelegate {
    public:
        virtual ~MediaDelegate() {}

        virtual int stitch(std::vector<T2>& frames, std::vector<T1>& output) = 0;
        virtual int encode(std::vector<T1>& frames) = 0;
    };

    struct MediaParam {
        MediaParam() {}

        int stitch_queue_size;
        int stitch_thread_num;

        int encode_queue_size;
        int encode_thread_num;

        bool stitch_blocking_push;
        bool encode_blocking_push;

    };

    // for one thread mode
    template<typename T1, typename T2>
    class BMMediaPipeline {
        std::shared_ptr<MediaDelegate<T1, T2>> m_media_delegate;

        std::shared_ptr<BlockingQueue<T2>> m_stitchQue;
        WorkerPool<T2> m_stitchWorkerPool;

        std::shared_ptr<BlockingQueue<T1>> m_encodeQue;
        WorkerPool<T1> m_encodeWorkerPool;

    public:

        BMMediaPipeline() {

        }

        virtual ~BMMediaPipeline() {

        }

        void flow_control(std::function<void(T2& obj)> fn1,
                          std::function<void(T1& obj)> fn2) {
            m_stitchQue->set_drop_fn(fn1);
            m_encodeQue->set_drop_fn(fn2);
        }

        template<typename... T>
        int init(const MediaParam &param, std::shared_ptr<MediaDelegate<T1, T2>> delegate, T&&... args) {
            m_media_delegate = delegate;

            const int underlying_type_std_queue = 0;
            m_stitchQue = std::make_shared<BlockingQueue<T2>>(
                    "stitch", underlying_type_std_queue,
                    param.stitch_queue_size);

            m_stitchWorkerPool.init(m_stitchQue.get(), 1, 1,
                                    1);
            m_stitchWorkerPool.startWork([this, &param](std::vector<T2> &items) {
                std::vector<T1> frames;
                m_media_delegate->stitch(items, frames);
                this->m_encodeQue->push(frames);
            });

            m_encodeQue = std::make_shared<BlockingQueue<T1>>(
                    "encode", underlying_type_std_queue,
                    param.encode_queue_size);

            m_encodeWorkerPool.init(m_encodeQue.get(), 1, 1, 8);
            m_encodeWorkerPool.startWork([this, &param](std::vector<T1> &items) {
                m_media_delegate->encode(items);
            });

            flow_control(std::forward<T>(args)...);
            return 0;
        }

        int flush_frame() {
            m_stitchWorkerPool.flush();
            return 0;
        }

        int push_frame(T2& frame) {
            m_stitchQue->push(frame);
            return 0;
        }

        int push_frame(T1 *frame) {
            m_stitchQue->push(*frame);
            return 0;
        }
    };

    template<typename T1, typename T2>
    class DetectorDelegate {
    protected:
        using DetectedFinishFunc = std::function<void(T2 &of)>;
        DetectedFinishFunc m_pfnDetectFinish;
        BMMediaPipeline<T1, T2>* m_nextMediaPipe = nullptr;

    public:
        virtual ~DetectorDelegate() {}
        void set_next_inference_pipe(BMMediaPipeline<T1, T2> *nextPipe) { m_nextMediaPipe = nextPipe; }

        virtual void decode_process(T1 &) {
            // do nothing by default
        }

        virtual int preprocess(std::vector<T1> &frames, std::vector<T2> &of) = 0;

        virtual int forward(std::vector<T2> &frames) = 0;

        virtual int postprocess(std::vector<T2> &frames) = 0;

        virtual int set_detected_callback(DetectedFinishFunc func) { m_pfnDetectFinish = func; return 0;};
    };

    struct DetectorParam {
        DetectorParam() {
            preprocess_queue_size = 5;
            preprocess_thread_num = 4;

            inference_queue_size = 5;
            inference_thread_num = 1;

            postprocess_queue_size = 5;
            postprocess_thread_num = 2;
            batch_num=4;
        }

        int preprocess_queue_size;
        int preprocess_thread_num;

        int inference_queue_size;
        int inference_thread_num;

        int postprocess_queue_size;
        int postprocess_thread_num;
        int batch_num;

    };

    template<typename T1, typename T2>
    class BMInferencePipe {
        DetectorParam m_param;
        std::shared_ptr<DetectorDelegate<T1, T2>> m_detect_delegate;

        std::shared_ptr<BlockingQueue<T1>> m_preprocessQue;
        std::shared_ptr<BlockingQueue<T2>> m_postprocessQue;
        std::shared_ptr<BlockingQueue<T2>> m_forwardQue;

        WorkerPool<T1> m_preprocessWorkerPool;
        WorkerPool<T2> m_forwardWorkerPool;
        WorkerPool<T2> m_postprocessWorkerPool;


    public:
        BMInferencePipe() {

        }

        virtual ~BMInferencePipe() {

        }

        void flow_control(std::function<void(T1& obj)> fn1,
                          std::function<void(T2& obj)> fn2,
                          std::function<void(T2& obj)> fn3) {
            m_preprocessQue->set_drop_fn( fn1);
            m_forwardQue->set_drop_fn( fn2);
            m_postprocessQue->set_drop_fn( fn3);
        }

        template<typename... T>
        int init(const DetectorParam &param, std::shared_ptr<DetectorDelegate<T1, T2>> delegate, T&&... args) {
            m_param = param;
            m_detect_delegate = delegate;

            const int underlying_type_std_queue = 0;
            m_preprocessQue = std::make_shared<BlockingQueue<T1>>(
                    "preprocess", underlying_type_std_queue,
                    param.preprocess_queue_size);
            m_postprocessQue = std::make_shared<BlockingQueue<T2>>(
                    "postprocess", underlying_type_std_queue,
                    param.postprocess_queue_size);
            m_forwardQue = std::make_shared<BlockingQueue<T2>>(
                    "inference", underlying_type_std_queue,
                    param.inference_queue_size);

            m_preprocessWorkerPool.init(m_preprocessQue.get(), param.preprocess_thread_num, param.batch_num, param.batch_num);
            m_preprocessWorkerPool.startWork([this, &param](std::vector<T1> &items) {
                std::vector<T2> frames;
                m_detect_delegate->preprocess(items, frames);
                this->m_forwardQue->push(frames);
            });

            m_forwardWorkerPool.init(m_forwardQue.get(), param.inference_thread_num, 1, 8);
            m_forwardWorkerPool.startWork([this, &param](std::vector<T2> &items) {
                m_detect_delegate->forward(items);
                this->m_postprocessQue->push(items);
            });

            m_postprocessWorkerPool.init(m_postprocessQue.get(), param.postprocess_thread_num, 1, 8);
            m_postprocessWorkerPool.startWork([this, &param](std::vector<T2> &items) {
                m_detect_delegate->postprocess(items);
            });

            flow_control(std::forward<T>(args)...);

            return 0;
        }

        int flush_frame() {
            m_preprocessWorkerPool.flush();
            return 0;
        }

        int push_frame(T1 *frame) {
            m_preprocessQue->push(*frame);
            return 0;
        }
    };


} // end namespace bm


#endif //INFERENCE_FRAMEWORK_INFERENCE3_H