2 * Copyright 2013 Sveriges Television AB http://casparcg.com/
\r
4 * This file is part of CasparCG (www.casparcg.com).
\r
6 * CasparCG is free software: you can redistribute it and/or modify
\r
7 * it under the terms of the GNU General Public License as published by
\r
8 * the Free Software Foundation, either version 3 of the License, or
\r
9 * (at your option) any later version.
\r
11 * CasparCG is distributed in the hope that it will be useful,
\r
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
\r
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
\r
14 * GNU General Public License for more details.
\r
16 * You should have received a copy of the GNU General Public License
\r
17 * along with CasparCG. If not, see <http://www.gnu.org/licenses/>.
\r
19 * Author: Robert Nagy, ronag89@gmail.com
\r
22 #include "../../stdafx.h"
\r
24 #include "audio_mixer.h"
\r
26 #include <core/mixer/write_frame.h>
\r
27 #include <core/producer/frame/frame_transform.h>
\r
28 #include <common/diagnostics/graph.h>
\r
29 #include "audio_util.h"
\r
31 #include <tbb/cache_aligned_allocator.h>
\r
33 #include <boost/range/adaptors.hpp>
\r
34 #include <boost/range/distance.hpp>
\r
40 namespace caspar { namespace core {
\r
45 frame_transform transform;
\r
46 audio_buffer audio_data;
\r
52 audio_item(audio_item&& other)
\r
53 : tag(std::move(other.tag))
\r
54 , transform(std::move(other.transform))
\r
55 , audio_data(std::move(other.audio_data))
\r
60 typedef std::vector<float, tbb::cache_aligned_allocator<float>> audio_buffer_ps;
\r
64 frame_transform prev_transform;
\r
65 audio_buffer_ps audio_data;
\r
68 struct audio_mixer::implementation
\r
70 safe_ptr<diagnostics::graph> graph_;
\r
71 std::stack<core::frame_transform> transform_stack_;
\r
72 std::map<const void*, audio_stream> audio_streams_;
\r
73 std::vector<audio_item> items_;
\r
74 std::vector<size_t> audio_cadence_;
\r
75 video_format_desc format_desc_;
\r
76 channel_layout channel_layout_;
\r
77 float master_volume_;
\r
78 float previous_master_volume_;
\r
81 implementation(const safe_ptr<diagnostics::graph>& graph)
\r
83 , format_desc_(video_format_desc::get(video_format::invalid))
\r
84 , channel_layout_(channel_layout::stereo())
\r
85 , master_volume_(1.0f)
\r
86 , previous_master_volume_(master_volume_)
\r
88 graph_->set_color("volume", diagnostics::color(1.0f, 0.8f, 0.1f));
\r
89 transform_stack_.push(core::frame_transform());
\r
92 void begin(core::basic_frame& frame)
\r
94 transform_stack_.push(transform_stack_.top()*frame.get_frame_transform());
\r
97 void visit(core::write_frame& frame)
\r
99 if(transform_stack_.top().volume < 0.002 || frame.audio_data().empty())
\r
103 item.tag = frame.tag();
\r
104 item.transform = transform_stack_.top();
\r
106 if (needs_rearranging(frame.get_channel_layout(), channel_layout_))
\r
108 auto src_view = frame.get_multichannel_view();
\r
110 audio_buffer rearranged_buffer;
\r
111 rearranged_buffer.resize(
\r
112 src_view.num_samples() * channel_layout_.num_channels);
\r
114 auto dst_view = make_multichannel_view<int32_t>(
\r
115 rearranged_buffer.begin(),
\r
116 rearranged_buffer.end(),
\r
119 bool rearrange_success = rearrange_or_rearrange_and_mix(
\r
120 src_view, dst_view, default_mix_config_repository());
\r
122 if (!rearrange_success)
\r
124 failed_rearrange(item.tag, src_view.channel_layout());
\r
127 item.audio_data = std::move(rearranged_buffer);
\r
131 item.audio_data = std::move(frame.audio_data()); // Note: We don't need to care about upper/lower since audio_data is removed/moved from the last field.
\r
134 items_.push_back(std::move(item));
\r
137 void begin(const core::frame_transform& transform)
\r
139 transform_stack_.push(transform_stack_.top()*transform);
\r
144 transform_stack_.pop();
\r
147 float get_master_volume() const
\r
149 return master_volume_;
\r
152 void set_master_volume(float volume)
\r
154 master_volume_ = volume;
\r
157 audio_buffer mix(const video_format_desc& format_desc, const channel_layout& layout)
\r
159 if(format_desc_ != format_desc)
\r
161 audio_streams_.clear();
\r
162 audio_cadence_ = format_desc.audio_cadence;
\r
163 format_desc_ = format_desc;
\r
164 channel_layout_ = layout;
\r
167 std::map<const void*, audio_stream> next_audio_streams;
\r
169 BOOST_FOREACH(auto& item, items_)
\r
171 audio_buffer_ps next_audio;
\r
173 auto next_transform = item.transform;
\r
174 auto prev_transform = next_transform;
\r
176 const auto it = audio_streams_.find(item.tag);
\r
177 if(it != audio_streams_.end())
\r
179 prev_transform = it->second.prev_transform;
\r
180 next_audio = std::move(it->second.audio_data);
\r
183 if(prev_transform.volume < 0.001 && next_transform.volume < 0.001)
\r
186 const float prev_volume = static_cast<float>(prev_transform.volume) * previous_master_volume_;
\r
187 const float next_volume = static_cast<float>(next_transform.volume) * master_volume_;
\r
189 auto alpha = (next_volume-prev_volume)/static_cast<float>(item.audio_data.size()/channel_layout_.num_channels);
\r
191 for(size_t n = 0; n < item.audio_data.size(); ++n)
\r
193 auto sample_multiplier = (prev_volume + (n/channel_layout_.num_channels) * alpha);
\r
194 next_audio.push_back(item.audio_data[n] * sample_multiplier);
\r
197 next_audio_streams[item.tag].prev_transform = std::move(next_transform); // Store all active tags, inactive tags will be removed at the end.
\r
198 next_audio_streams[item.tag].audio_data = std::move(next_audio);
\r
201 previous_master_volume_ = master_volume_;
\r
204 audio_streams_ = std::move(next_audio_streams);
\r
206 if(audio_streams_.empty())
\r
207 audio_streams_[nullptr].audio_data = audio_buffer_ps(audio_size(audio_cadence_.front()), 0.0f);
\r
211 auto nb_invalid_streams = boost::count_if(audio_streams_ | boost::adaptors::map_values, [&](const audio_stream& x)
\r
213 return x.audio_data.size() < audio_size(audio_cadence_.front());
\r
216 if(nb_invalid_streams > 0)
\r
217 CASPAR_LOG(trace) << "[audio_mixer] Incorrect frame audio cadence detected.";
\r
220 std::vector<float> result_ps(audio_size(audio_cadence_.front()), 0.0f);
\r
222 BOOST_FOREACH(auto& stream, audio_streams_ | boost::adaptors::map_values)
\r
224 //CASPAR_LOG(debug) << stream.audio_data.size() << L" : " << result_ps.size();
\r
226 if(stream.audio_data.size() < result_ps.size())
\r
228 stream.audio_data.resize(result_ps.size(), 0.0f);
\r
229 CASPAR_LOG(trace) << L"[audio_mixer] Appended zero samples";
\r
232 auto out = boost::range::transform(result_ps, stream.audio_data, std::begin(result_ps), std::plus<float>());
\r
233 stream.audio_data.erase(std::begin(stream.audio_data), std::begin(stream.audio_data) + std::distance(std::begin(result_ps), out));
\r
236 boost::range::rotate(audio_cadence_, std::begin(audio_cadence_)+1);
\r
238 audio_buffer result;
\r
239 result.reserve(result_ps.size());
\r
240 boost::range::transform(result_ps, std::back_inserter(result), [](float sample){return static_cast<int32_t>(sample);});
\r
242 auto max = boost::range::max_element(result);
\r
244 graph_->set_value("volume", static_cast<double>(std::abs(*max))/std::numeric_limits<int32_t>::max());
\r
249 size_t audio_size(size_t num_samples) const
\r
251 return num_samples * channel_layout_.num_channels;
\r
254 void failed_rearrange(const void* tag, const channel_layout& layout)
\r
256 if (audio_streams_.find(tag) != audio_streams_.end())
\r
257 return; // We don't want to flood the logs.
\r
259 CASPAR_LOG(warning)
\r
260 << L"[audio_mixer] Could not satisfactory down/upmix from "
\r
261 << layout.name << L" to " << channel_layout_.name
\r
262 << L" because no mix config was found for "
\r
263 << layout.layout_type << L" => " << channel_layout_.layout_type
\r
264 << L". This might cause audio to be lost.";
\r
268 audio_mixer::audio_mixer(const safe_ptr<diagnostics::graph>& graph) : impl_(new implementation(graph)){}
\r
269 void audio_mixer::begin(core::basic_frame& frame){impl_->begin(frame);}
\r
270 void audio_mixer::visit(core::write_frame& frame){impl_->visit(frame);}
\r
271 void audio_mixer::end(){impl_->end();}
\r
272 float audio_mixer::get_master_volume() const { return impl_->get_master_volume(); }
\r
273 void audio_mixer::set_master_volume(float volume) { impl_->set_master_volume(volume); }
\r
274 audio_buffer audio_mixer::operator()(const video_format_desc& format_desc, const channel_layout& layout){return impl_->mix(format_desc, layout);}
\r