1 #include "../../StdAfx.h"
\r
3 #include "parallel_yadif.h"
\r
5 #include <common/log/log.h>
\r
7 #if defined(_MSC_VER)
\r
8 #pragma warning (push)
\r
9 #pragma warning (disable : 4244)
\r
13 #include <libavfilter/avfilter.h>
\r
15 #if defined(_MSC_VER)
\r
16 #pragma warning (pop)
\r
19 #include <tbb/parallel_for.h>
\r
20 #include <tbb/concurrent_queue.h>
\r
22 #include <boost/thread/once.hpp>
\r
// Trailing members of a record whose opening line is not visible in this view.
// make_parallel_yadif casts AVFilterContext::priv to YADIFContext* and reads and
// writes its filter_line member, so these are presumably the fields of that
// YADIFContext declaration — TODO confirm against the full file.
// NOTE(review): if this is a local mirror of a libavfilter-private struct, the
// field order would have to match the linked libavfilter build — verify.
29 AVFilterBufferRef *cur;
\r
30 AVFilterBufferRef *next;
\r
31 AVFilterBufferRef *prev;
\r
32 AVFilterBufferRef *out;
\r
// Function-pointer member. make_parallel_yadif copies its current value into
// org_yadif_filter_line and then stores a pooled trampoline here.
33 void (*filter_line)(uint8_t *dst,
\r
34 uint8_t *prev, uint8_t *cur, uint8_t *next,
\r
35 int w, int prefs, int mrefs, int parity, int mode);
\r
36 //const AVPixFmtDescriptor *csp;
\r
// State handed to parallel_yadif_filter_line: that function appends argument
// records to `args` and uses `index` as the number of records stored so far.
// The member declarations themselves are not visible in this view.
39 struct parallel_yadif_context
\r
// Start with no recorded calls (index == 0).
57 parallel_yadif_context() : index(0){}
\r
// Global holding the filter_line callback that was installed on the yadif
// context before make_parallel_yadif replaced it; the parallel_for body in
// parallel_yadif_filter_line calls through it. It is initialised to null and
// the only assignment visible in this view is the one in make_parallel_yadif.
60 void (*org_yadif_filter_line)(uint8_t *dst, uint8_t *prev, uint8_t *cur, uint8_t *next, int w, int prefs, int mrefs, int parity, int mode) = 0;
\r
// Records one filter-line call in `ctx` and replays the recorded calls through
// org_yadif_filter_line using tbb::parallel_for.
//
// ctx  - per-trampoline state; receives the new record and is read back when
//        the recorded calls are replayed.
// dst, prev, cur, next, w, prefs, mrefs, parity, mode - stored unchanged and
//        later passed verbatim to org_yadif_filter_line.
//
// Some lines between the record step and the parallel_for call are not visible
// in this view, so the condition (if any) that triggers the replay, and where
// ctx.index is reset, cannot be stated from here.
62 void parallel_yadif_filter_line(parallel_yadif_context& ctx, uint8_t *dst, uint8_t *prev, uint8_t *cur, uint8_t *next, int w, int prefs, int mrefs, int parity, int mode)
\r
// Pack the arguments of this call into one record.
64 parallel_yadif_context::arg arg = {dst, prev, cur, next, w, prefs, mrefs, parity, mode};
\r
// Append the record and advance the count.
// NOTE(review): no bounds check is visible on this write; the capacity of
// `args` is declared outside this view — verify it cannot be exceeded.
65 ctx.args[ctx.index++] = arg;
\r
// Replay records [0, ctx.index) across TBB worker threads.
// NOTE(review): `[=]` captures by copy, and since `ctx` is a reference the
// closure holds a copy of the whole context object; confirm this is intended.
69 tbb::parallel_for(tbb::blocked_range<size_t>(0, ctx.index), [=](const tbb::blocked_range<size_t>& r)
\r
// Each task handles the sub-range of record indices it was given.
71 for(auto n = r.begin(); n != r.end(); ++n)
\r
72 org_yadif_filter_line(ctx.args[n].dst, ctx.args[n].prev, ctx.args[n].cur, ctx.args[n].next, ctx.args[n].w, ctx.args[n].prefs, ctx.args[n].mrefs, ctx.args[n].parity, ctx.args[n].mode);
\r
// Generates the trampolines f0..f17.
// RENAME(a) token-pastes `f` onto its argument to form the function name.
// The backslash-continued lines below are the body of the ff(x) macro (its
// `#define` line is not visible in this view). Each generated function has the
// same signature as the filter_line callback, owns one function-local static
// parallel_yadif_context, and forwards its arguments together with that
// context to parallel_yadif_filter_line. The final line instantiates the macro
// for 0 through 17.
// No comments are placed inside the macro body because those lines rely on
// backslash continuation.
78 #define RENAME(a) f ## a
\r
81 void RENAME(x)(uint8_t *dst, uint8_t *prev, uint8_t *cur, uint8_t *next, int w, int prefs, int mrefs, int parity, int mode) \
\r
83 static parallel_yadif_context ctx;\
\r
84 parallel_yadif_filter_line(ctx, dst, prev, cur, next, w, prefs, mrefs, parity, mode);\
\r
87 ff(0); ff(1); ff(2); ff(3); ff(4); ff(5); ff(6); ff(7); ff(8); ff(9); ff(10); ff(11); ff(12); ff(13); ff(14); ff(15); ff(16); ff(17);
\r
// Table of the 18 generated trampolines f0..f17, in index order. The loop that
// seeds parallel_line_func_pool pushes every entry of this table.
89 void (*fs[])(uint8_t *dst, uint8_t *prev, uint8_t *cur, uint8_t *next, int w, int prefs, int mrefs, int parity, int mode) =
\r
90 {f0, f1, f2, f3, f4, f5, f6, f7, f8, f9, f10, f11, f12, f13, f14, f15, f16, f17};
\r
// Pool of trampolines that are not currently handed out. Entries are pushed by
// the loop over fs and by return_parallel_yadif, and taken with try_pop in
// make_parallel_yadif. Element type is the filter_line function-pointer type.
94 tbb::concurrent_bounded_queue<decltype(org_yadif_filter_line)> parallel_line_func_pool;
\r
// Seeds parallel_line_func_pool with every trampoline in fs.
// The enclosing function header is not visible in this view; make_parallel_yadif
// runs `init_pool` through boost::call_once, so this is presumably its body —
// TODO confirm.
// NOTE(review): `n` is a signed int compared against an unsigned sizeof
// expression; harmless for 18 entries but it draws sign-compare warnings.
98 for(int n = 0; n < sizeof(fs)/sizeof(fs[0]); ++n)
\r
99 parallel_line_func_pool.push(fs[n]);
\r
// Deleter for the shared_ptr handles returned by make_parallel_yadif: puts a
// trampoline back into parallel_line_func_pool.
//
// func - the pointer owned by the handle; either a trampoline or null.
102 void return_parallel_yadif(void* func)
\r
// make_parallel_yadif can create handles that own null, so null is skipped
// rather than pushed into the pool.
104 if(func != nullptr)
\r
// NOTE(review): decltype(fs[0]) is a reference type because fs[0] is an lvalue,
// so this cast reinterprets the storage of `func` as a function pointer rather
// than converting its value; confirm this is intended on all target platforms.
105 parallel_line_func_pool.push(reinterpret_cast<decltype(fs[0])>(func));
\r
// Installs a pooled trampoline as the filter_line callback of the given filter
// context and returns a handle whose deleter (return_parallel_yadif) gives the
// trampoline back to the pool.
//
// ctx    - filter context; its `priv` member is cast to YADIFContext*.
// height - value tested for divisibility by 64 (see the first check below).
//
// Returns a std::shared_ptr<void> owning the popped trampoline, or owning null
// when height is not a multiple of 64 or no trampoline was available.
108 std::shared_ptr<void> make_parallel_yadif(AVFilterContext* ctx, size_t height)
\r
// Heights that are not a multiple of 64 get a null handle and the filter
// context is left untouched. The reason for the multiple-of-64 requirement is
// not stated in the visible code.
110 if(height % 64 != 0)
\r
111 return std::shared_ptr<void>(nullptr, return_parallel_yadif);
\r
// Run init_pool exactly once, no matter how many callers reach this point.
113 static boost::once_flag flag = BOOST_ONCE_INIT;
\r
114 boost::call_once(&init_pool, flag);
\r
116 YADIFContext* yadif = (YADIFContext*)ctx->priv;
\r
// Remember the callback currently installed on the context so the trampolines
// can call through it. This is an unsynchronised write to a shared global; the
// original author judged the race benign (presumably because every caller
// stores the same function pointer — TODO confirm).
117 org_yadif_filter_line = yadif->filter_line; // Data race is not a problem.
\r
// Try to take a free trampoline; `func` stays null when the pool is empty.
119 decltype(org_yadif_filter_line) func = nullptr;
\r
120 if(!parallel_line_func_pool.try_pop(func))
\r
121 CASPAR_LOG(warning) << "Not enough scalable-yadif context instances. Running non-scalable";
\r
// NOTE(review): the line before this assignment is not visible in this view.
// If it is not an `else`, an empty pool would store null into
// yadif->filter_line — verify against the full file.
123 yadif->filter_line = func;
\r
// The deleter returns the trampoline to the pool when the last handle copy is
// destroyed; a null `func` is ignored by the deleter.
125 return std::shared_ptr<void>(func, return_parallel_yadif);
\r