OSSIA
Open Scenario System for Interactive Application
Loading...
Searching...
No Matches
sound_libav.hpp
1#pragma once
2#include <ossia/detail/config.hpp>
3
4#include <ossia/audio/audio_parameter.hpp>
5#include <ossia/dataflow/audio_stretch_mode.hpp>
6#include <ossia/dataflow/graph_node.hpp>
7#include <ossia/dataflow/nodes/media.hpp>
8#include <ossia/dataflow/nodes/sound.hpp>
9#include <ossia/dataflow/port.hpp>
10#include <ossia/detail/libav.hpp>
11#include <ossia/detail/pod_vector.hpp>
12
13#include <algorithm>
14#include <type_traits>
15
16extern "C" {
17#include <libavcodec/avcodec.h>
18#include <libavformat/avformat.h>
19#include <libavutil/frame.h>
20#include <libavutil/mem.h>
21#include <libswresample/swresample.h>
22}
23
24namespace ossia::nodes
25{
26class sound_libav final : public ossia::sound_node
27{
28 AVPacket* packet{};
29 AVFrame* frame{};
30
31public:
32 sound_libav()
33 : packet{av_packet_alloc()}
34 , frame{av_frame_alloc()}
35 {
36 m_outlets.push_back(&audio_out);
37 }
38
39 ~sound_libav()
40 {
41 m_handle.cleanup();
42
43 av_frame_free(&frame);
44 av_packet_free(&packet);
45 }
46
47 std::string label() const noexcept override { return "sound_libav"; }
48
49 void set_start(std::size_t v) { start = v; }
50
51 void set_upmix(std::size_t v) { upmix = v; }
52
53 void set_sound(libav_handle hdl)
54 {
55 using namespace snd;
56 m_handle.cleanup();
57 m_handle = std::move(hdl);
58
59 m_tmp.clear();
60 m_channel_q = boost::circular_buffer<float>(8192 * m_handle.channels());
61 }
62
63 void transport(time_value flicks) override
64 {
65 m_channel_q.clear();
66 ossia::seek_to_flick(
67 m_handle.format, m_handle.codec, m_handle.stream, flicks.impl, AVSEEK_FLAG_ANY);
68 }
69
70 void transport(time_value flicks, const ossia::tick_transport_info& tinfo) override
71 {
72 m_channel_q.clear();
73 // Scale flicks by |timeline_tempo| / file_tempo when stretching; otherwise
74 // seek at the raw model time. See file_sample_for_model_time.
75 int64_t target_flicks = flicks.impl;
76 const double abs_tempo = std::abs(tinfo.current_tempo);
77 if(m_resampler.stretch() && tempo > 0.0 && abs_tempo > 0.0)
78 {
79 target_flicks = int64_t(double(flicks.impl) * abs_tempo / tempo);
80 }
81 ossia::seek_to_flick(
82 m_handle.format, m_handle.codec, m_handle.stream, target_flicks,
83 AVSEEK_FLAG_ANY);
84 }
85
86 void fetch_from_libav(int samples_to_write)
87 {
88 const std::size_t channels = this->channels();
89 if(channels == 0)
90 return;
91
92 auto floats_to_write = channels * samples_to_write;
93 while(m_channel_q.size() < floats_to_write)
94 {
95 // FIXME this is buggy
96 if(m_channel_q.capacity() < 4 * floats_to_write)
97 {
98 m_channel_q.set_capacity(4 * floats_to_write);
99 }
100
101 // Need to fetch more data
102 auto fmt_ctx = m_handle.format;
103 auto codec_ctx = m_handle.codec;
104 auto stream = m_handle.stream;
105 {
106 int ret{};
107 {
108 av_packet_unref(packet);
109 ret = av_read_frame(fmt_ctx, packet);
110
111 while(ret >= 0 && ret != AVERROR(EOF) && packet->stream_index != stream->index)
112 {
113 av_packet_unref(packet);
114 ret = av_read_frame(fmt_ctx, packet);
115 }
116 if(ret == AVERROR(EOF))
117 {
118 break;
119 }
120 }
121 if(ret < 0)
122 {
123 return;
124 }
125
126 ret = avcodec_send_packet(codec_ctx, packet);
127 if(ret == 0)
128 {
129 ret = avcodec_receive_frame(codec_ctx, frame);
130 if(ret == 0)
131 {
132 const int samples = frame->nb_samples;
133 m_tmp.resize(samples * channels, boost::container::default_init);
134 float* out_ptr = m_tmp.data();
135 const int read_samples = swr_convert(
136 m_handle.resample, (uint8_t**)&out_ptr, samples,
137 (const uint8_t**)frame->extended_data, samples);
138
139 m_channel_q.insert(
140 m_channel_q.end(), out_ptr, out_ptr + read_samples * channels);
141 }
142 }
143 }
144 }
145 }
146
147 template <typename T>
148 void
149 fetch_audio(int64_t start, int64_t samples_to_write, T** audio_array_base) noexcept
150 {
151 const std::size_t channels = this->channels();
152 if(channels == 0)
153 return;
154
155 fetch_from_libav(samples_to_write);
156
157 // FIXME start offset
158 for(int k = 0; k < samples_to_write; k++)
159 {
160 for(std::size_t chan = 0; chan < channels; chan++)
161 {
162 if(m_channel_q.size() > 0)
163 {
164 audio_array_base[chan][k] = m_channel_q.front();
165 m_channel_q.pop_front();
166 }
167 else
168 {
169 audio_array_base[chan][k] = 0.;
170 }
171 }
172 }
173 }
174
175 template <typename T>
176 void fetch_audio_backward(
177 int64_t start, int64_t samples_to_write, T** audio_array_base) noexcept
178 {
179 const std::size_t channels = this->channels();
180 if(channels == 0)
181 return;
182
183 // For backward playback with libav:
184 // 1. Calculate the position we need to start reading from (going backwards)
185 // 2. Seek to that earlier position
186 // 3. Read forward
187 // 4. Reverse the samples
188
189 // Calculate backward start position
190 int64_t backward_start = start - samples_to_write + 1;
191 if(backward_start < 0)
192 backward_start = 0;
193
194 // Seek to the backward position
195 // Convert sample position to flicks for seeking
196 const int64_t sample_rate = m_handle.stream->codecpar->sample_rate;
197 if(sample_rate > 0)
198 {
199 // flicks = samples * flicks_per_second / sample_rate
200 constexpr int64_t flicks_per_second = 705600000LL;
201 int64_t flicks_pos = backward_start * flicks_per_second / sample_rate;
202
203 m_channel_q.clear();
204 ossia::seek_to_flick(
205 m_handle.format, m_handle.codec, m_handle.stream, flicks_pos, AVSEEK_FLAG_BACKWARD);
206 }
207
208 // Fetch the audio forward
209 fetch_from_libav(samples_to_write);
210
211 // Read into output, then reverse
212 for(int64_t k = 0; k < samples_to_write; k++)
213 {
214 for(std::size_t chan = 0; chan < channels; chan++)
215 {
216 if(m_channel_q.size() > 0)
217 {
218 audio_array_base[chan][k] = m_channel_q.front();
219 m_channel_q.pop_front();
220 }
221 else
222 {
223 audio_array_base[chan][k] = 0.;
224 }
225 }
226 }
227
228 // Reverse each channel in-place
229 for(std::size_t chan = 0; chan < channels; chan++)
230 {
231 std::reverse(audio_array_base[chan], audio_array_base[chan] + samples_to_write);
232 }
233 }
234
235 void run(const ossia::token_request& t, ossia::exec_state_facade e) noexcept override
236 {
237 if(!m_handle)
238 return;
239
240 const auto channels = m_handle.channels();
241 const auto len = m_handle.totalPCMFrameCount();
242
243 ossia::audio_port& ap = *audio_out;
244 ap.set_channels(std::max((std::size_t)upmix, (std::size_t)channels));
245
246 const auto [samples_to_read, samples_to_write]
247 = snd::sample_info(e.bufferSize(), e.modelToSamples(), t);
248 if(samples_to_write <= 0)
249 return;
250
251 assert(samples_to_write > 0);
252
253 const auto samples_offset = t.physical_start(e.modelToSamples());
254
255 if(t.forward())
256 {
257 if(t.prev_date < m_prev_date)
258 {
259 // First run after add_time_process() left the stretcher already
260 // primed; calling transport() again would reset it.
261 if(m_prev_date == ossia::time_value{ossia::time_value::infinite_min})
262 m_prev_date = t.prev_date;
263 else
264 transport(t.prev_date);
265 }
266 }
267 else
268 {
269 if(t.prev_date > m_prev_date)
270 {
271 if(m_prev_date == ossia::time_value{ossia::time_value::infinite_min})
272 m_prev_date = t.prev_date;
273 else
274 transport(t.prev_date);
275 }
276 }
277
278 for(int chan = 0; chan < channels; chan++)
279 {
280 ap.channel(chan).resize(e.bufferSize());
281 }
282
283 const double stretch_ratio = update_stretch(t, e);
284 const double abs_stretch_ratio = std::abs(stretch_ratio);
285
286 m_resampler.run(
287 *this, t, e, stretch_ratio, channels, len, samples_to_read, samples_to_write,
288 samples_offset, ap);
289
290 const bool start_discontinuous = t.start_discontinuous || (m_last_stretch > 70.);
291 const bool end_discontinuous = t.end_discontinuous || (abs_stretch_ratio > 70.);
292 if(abs_stretch_ratio > 70. && m_last_stretch > 70.)
293 {
294 [[unlikely]];
295 for(std::size_t i = 0; i < channels; i++)
296 {
297 ossia::snd::do_zero(ap.channel(i), samples_offset, samples_to_write);
298 }
299 }
300 else
301 {
302 [[likely]];
303 for(int chan = 0; chan < channels; chan++)
304 {
305 // fade
306 snd::do_fade(
307 start_discontinuous, end_discontinuous, ap.channel(chan), samples_offset,
308 samples_to_write);
309 }
310 }
311
312 ossia::snd::perform_upmix(this->upmix, channels, ap);
313 ossia::snd::perform_start_offset(this->start, ap);
314
315 m_prev_date = t.date;
316 m_last_stretch = abs_stretch_ratio;
317 }
318
319 [[nodiscard]] std::size_t channels() const
320 {
321 return m_handle ? m_handle.channels() : 0;
322 }
323 [[nodiscard]] std::size_t duration() const
324 {
325 return m_handle ? m_handle.totalPCMFrameCount() : 0;
326 }
327
328private:
329 libav_handle m_handle{};
330
331 ossia::audio_outlet audio_out;
332
333 std::size_t start{};
334 std::size_t upmix{};
335
336 ossia::pod_vector<float> m_tmp{};
337 boost::circular_buffer<float> m_channel_q;
338};
339
340}
The time_value class.
Definition ossia/editor/scenario/time_value.hpp:30