- \r
- tbb::parallel_for\r
- (\r
- tbb::blocked_range<size_t>(0, format_desc_.audio_samples_per_frame/4),\r
- [&](const tbb::blocked_range<size_t>& r)\r
- { \r
- auto alpha_ps = _mm_setr_ps(delta, delta, 0.0f, 0.0f);\r
- auto delta2_ps = _mm_set_ps1(delta*2.0f);\r
- auto prev_ps = _mm_set_ps1(prev_volume);\r
- auto next_ps = _mm_set_ps1(next_volume); \r
-\r
- for(size_t n = r.begin(); n < r.end(); ++n)\r
- { \r
- auto next2_ps = _mm_mul_ps(next_ps, alpha_ps);\r
- auto prev2_ps = _mm_sub_ps(prev_ps, _mm_mul_ps(prev_ps, alpha_ps));\r
- auto volume_ps = _mm_add_ps(next2_ps, prev2_ps);\r
-\r
- auto sample_ps = _mm_cvtepi32_ps(_mm_load_si128(reinterpret_cast<__m128i*>(&item.audio_data[n*4])));\r
- auto res_sample_ps = _mm_load_ps(&intermediate[n*4]); \r
- sample_ps = _mm_mul_ps(sample_ps, volume_ps); \r
- res_sample_ps = _mm_add_ps(sample_ps, res_sample_ps); \r
-\r
- alpha_ps = _mm_add_ps(alpha_ps, delta2_ps);\r
-\r
- _mm_store_ps(&intermediate[n*4], res_sample_ps);\r
- }\r
- }\r
- , ap);\r
+ \r
+ auto alpha_ps = _mm_setr_ps(delta, delta, 0.0f, 0.0f);\r
+ auto delta2_ps = _mm_set_ps1(delta*2.0f);\r
+ auto prev_ps = _mm_set_ps1(prev_volume);\r
+ auto next_ps = _mm_set_ps1(next_volume); \r
+\r
+ for(size_t n = 0; n < format_desc_.audio_samples_per_frame/4; ++n)\r
+ { \r
+ auto next2_ps = _mm_mul_ps(next_ps, alpha_ps);\r
+ auto prev2_ps = _mm_sub_ps(prev_ps, _mm_mul_ps(prev_ps, alpha_ps));\r
+ auto volume_ps = _mm_add_ps(next2_ps, prev2_ps);\r
+\r
+ auto sample_ps = _mm_cvtepi32_ps(_mm_load_si128(reinterpret_cast<__m128i*>(&item.audio_data[n*4])));\r
+ auto res_sample_ps = _mm_load_ps(&intermediate[n*4]); \r
+ sample_ps = _mm_mul_ps(sample_ps, volume_ps); \r
+ res_sample_ps = _mm_add_ps(sample_ps, res_sample_ps); \r
+\r
+ alpha_ps = _mm_add_ps(alpha_ps, delta2_ps);\r
+\r
+ _mm_store_ps(&intermediate[n*4], res_sample_ps);\r
+ }\r