2 * copyright (c) 2010 Sveriges Television AB <info@casparcg.com>
\r
4 * This file is part of CasparCG.
\r
6 * CasparCG is free software: you can redistribute it and/or modify
\r
7 * it under the terms of the GNU General Public License as published by
\r
8 * the Free Software Foundation, either version 3 of the License, or
\r
9 * (at your option) any later version.
\r
11 * CasparCG is distributed in the hope that it will be useful,
\r
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
\r
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
\r
14 * GNU General Public License for more details.
\r
16 * You should have received a copy of the GNU General Public License
\r
17 * along with CasparCG. If not, see <http://www.gnu.org/licenses/>.
\r
21 #include "../stdafx.h"
\r
23 #include "copy_field.h"
\r
27 #include <functional>
\r
29 #include "../utility/types.h"
\r
31 #include "tbb/parallel_for.h"
\r
32 #include "tbb/blocked_range.h"
\r
34 using namespace std::tr1::placeholders;
\r
36 namespace caspar{ namespace common{ namespace image{
\r
38 void Docopy_fieldParallel(size_t index, const std::tr1::function<void(void*, const void*, size_t)>& func, void* dest, const void* source, size_t width4)
\r
40 size_t offset = index*width4;
\r
41 size_t size = width4;
\r
42 func(reinterpret_cast<s8*>(dest) + offset, reinterpret_cast<const s8*>(source) + offset, size);
\r
45 void copy_fieldParallel(const std::tr1::function<void(void*, const void*, size_t)>& func, void* dest, const void* source, size_t fieldIndex, size_t width, size_t height)
\r
47 tbb::parallel_for(fieldIndex, height, static_cast<size_t>(2), std::bind(&Docopy_fieldParallel, std::placeholders::_1, func, dest, source, width*4)); // copy for each row
\r
50 copy_field_fun get_copy_field_fun(SIMD /*simd*/)
\r
53 // return copy_fieldParallel_SSE2;
\r
55 return copy_fieldParallel_REF; // REF is faster
\r
58 void copy_fieldParallel_SSE2(unsigned char* dest, const unsigned char* source, size_t fieldIndex, size_t width, size_t height)
\r
60 copy_fieldParallel(©_SSE2, dest, source, fieldIndex, width, height);
\r
63 void copy_field_REF(unsigned char* pDest, const unsigned char* pSrc, size_t fieldIndex, size_t width, size_t height)
\r
65 for(size_t rowIndex=fieldIndex; rowIndex < height; rowIndex+=2)
\r
67 int offset = width*4*rowIndex;
\r
68 __movsd(reinterpret_cast<unsigned long*>(&(pDest[offset])), reinterpret_cast<const unsigned long*>(&(pSrc[offset])), width);
\r
72 void copy_fieldParallel_REF(unsigned char* dest, const unsigned char* source, size_t fieldIndex, size_t width, size_t height)
\r
74 copy_fieldParallel(©_REF, dest, source, fieldIndex, width, height);
\r