2 * Inter-thread scheduling/synchronization.
3 * Copyright (c) 2023 Anton Khirnov
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 #ifndef FFTOOLS_FFMPEG_SCHED_H
23 #define FFTOOLS_FFMPEG_SCHED_H
28 #include "ffmpeg_utils.h"
31 * This file contains the API for the transcode scheduler.
33 * Overall architecture of the transcoding process involves instances of the
34 * following components:
35 * - demuxers, each containing any number of demuxed streams; demuxed packets
36 * belonging to some stream are sent to any number of decoders (transcoding)
37 * and/or muxers (streamcopy);
38 * - decoders, which receive encoded packets from some demuxed stream or
39 * encoder, decode them, and send decoded frames to any number of filtergraph
40 * inputs (audio/video) or encoders (subtitles);
41 * - filtergraphs, each containing zero or more inputs (0 in case the
42 * filtergraph contains a lavfi source filter), and one or more outputs; the
43 * inputs and outputs need not have matching media types;
44 * each filtergraph input receives decoded frames from some decoder or another filtergraph output;
46 * filtered frames from each output are sent to some encoder;
47 * - encoders, which receive decoded frames from some decoder (subtitles) or
48 * some filtergraph output (audio/video), encode them, and send encoded
49 * packets to any number of muxed streams or decoders;
50 * - muxers, each containing any number of muxed streams; each muxed stream
51 * receives encoded packets from some demuxed stream (streamcopy) or some
52 * encoder (transcoding); those packets are interleaved and written out by the muxer.
55 * The structure formed by the above components is a directed acyclic graph
56 * (absence of cycles is checked at startup).
58 * There must be at least one muxer instance, otherwise the transcode produces
59 * no output and is meaningless. Beyond that, in a generic transcoding scenario
60 * there may be an arbitrary number of instances of any of the above components,
61 * interconnected in various ways.
63 * The code tries to keep all the output streams across all the muxers in sync
64 * (i.e. at the same DTS), which is accomplished by varying the rates at which
65 * packets are read from different demuxers and lavfi sources. Note that the
66 * degree of control we have over synchronization is fundamentally limited - if
67 * some demuxed streams in the same input are interleaved at different rates
68 * than that at which they are to be muxed (e.g. because an input file is badly
69 * interleaved, or the user changed their speed by mismatching amounts), then
70 * there will be increasing amounts of buffering followed by eventual
71 * transcoding failure.
73 * N.B. 1: there are meaningful transcode scenarios with no demuxers, e.g.
74 * - encoding and muxing output from filtergraph(s) that have no inputs;
75 * - creating a file that contains nothing but attachments and/or metadata.
77 * N.B. 2: a filtergraph output could, in principle, feed multiple encoders, but
78 * this is unnecessary because the (a)split filter provides the same functionality.
81 * The scheduler, in the above model, is the master object that oversees and
82 * facilitates the transcoding process. The basic idea is that all instances
83 * of the abovementioned components communicate only with the scheduler and not
84 * with each other. The scheduler is then the single place containing the
85 * knowledge about the whole transcoding pipeline.
/**
 * Scheduler handle type. Only the type name is introduced here; the struct
 * layout is not defined in the visible part of this header, and every
 * sch_*() function in it takes the scheduler by pointer.
 */
91 typedef struct Scheduler Scheduler
;
93 enum SchedulerNodeType
{
94 SCH_NODE_TYPE_NONE
= 0,
99 SCH_NODE_TYPE_FILTER_IN
,
100 SCH_NODE_TYPE_FILTER_OUT
,
103 typedef struct SchedulerNode
{
104 enum SchedulerNodeType type
;
/**
 * Signature of a task function registered through the sch_add_*() calls
 * (their func parameter has this type).
 *
 * @param arg Opaque pointer; the sch_add_*() documentation describes the
 *            accompanying ctx value as being passed to func.
 * @return int status. NOTE(review): the meaning of the return value is not
 *         specified in this header - confirm against the implementation.
 */
109 typedef int (*SchThreadFunc
)(void *arg
);
/**
 * Expands to a SchedulerNode compound literal with
 * .type = SCH_NODE_TYPE_DEMUX, .idx = file and .idx_stream = stream.
 * NOTE(review): presumably file/stream are the indices returned by
 * sch_add_demux() and sch_add_demux_stream() - confirm with callers.
 */
111 #define SCH_DSTREAM(file, stream) \
112 (SchedulerNode){ .type = SCH_NODE_TYPE_DEMUX, \
113 .idx = file, .idx_stream = stream }
/**
 * Expands to a SchedulerNode compound literal with
 * .type = SCH_NODE_TYPE_MUX, .idx = file and .idx_stream = stream.
 * NOTE(review): presumably file/stream are the indices returned by
 * sch_add_mux() and sch_add_mux_stream() - confirm with callers.
 */
114 #define SCH_MSTREAM(file, stream) \
115 (SchedulerNode){ .type = SCH_NODE_TYPE_MUX, \
116 .idx = file, .idx_stream = stream }
117 #define SCH_DEC_IN(decoder) \
118 (SchedulerNode){ .type = SCH_NODE_TYPE_DEC, \
120 #define SCH_DEC_OUT(decoder, out_idx) \
121 (SchedulerNode){ .type = SCH_NODE_TYPE_DEC, \
122 .idx = decoder, .idx_stream = out_idx }
123 #define SCH_ENC(encoder) \
124 (SchedulerNode){ .type = SCH_NODE_TYPE_ENC, \
126 #define SCH_FILTER_IN(filter, input) \
127 (SchedulerNode){ .type = SCH_NODE_TYPE_FILTER_IN, \
128 .idx = filter, .idx_stream = input }
/**
 * Expands to a SchedulerNode compound literal with
 * .type = SCH_NODE_TYPE_FILTER_OUT, .idx = filter and .idx_stream = output.
 * NOTE(review): presumably filter is an index returned by
 * sch_add_filtergraph() and output is below its nb_outputs - confirm.
 */
129 #define SCH_FILTER_OUT(filter, output) \
130 (SchedulerNode){ .type = SCH_NODE_TYPE_FILTER_OUT, \
131 .idx = filter, .idx_stream = output }
/**
 * Create a scheduler instance.
 *
 * @return Pointer to the new Scheduler. NOTE(review): presumably NULL on
 *         allocation failure - confirm against the implementation.
 */
133 Scheduler
*sch_alloc(void);
/**
 * Release a scheduler.
 *
 * @param sch Address of the scheduler handle (note the double pointer).
 *            NOTE(review): presumably *sch is reset to NULL on return and a
 *            NULL *sch is tolerated - confirm against the implementation.
 */
134 void sch_free(Scheduler
**sch
);
/**
 * Start the scheduler.
 * NOTE(review): undocumented in this header; presumably launches the tasks
 * registered through the sch_add_*() functions - confirm.
 *
 * @return int status. NOTE(review): presumably 0 on success and a negative
 *         error code on failure - confirm.
 */
136 int sch_start(Scheduler
*sch
);
/**
 * Stop the scheduler.
 * NOTE(review): undocumented in this header; the details below are inferred
 * from the signature and must be confirmed against the implementation.
 *
 * @param finish_ts Output pointer; presumably receives the final transcode
 *                  timestamp. Whether NULL is accepted is not visible here.
 * @return int status; presumably a negative error code on failure.
 */
137 int sch_stop(Scheduler
*sch
, int64_t *finish_ts
);
140 * Wait until transcoding terminates or the specified timeout elapses.
142 * @param timeout_us Amount of time in microseconds after which this function times out.
144 * @param transcode_ts Current transcode timestamp in AV_TIME_BASE_Q, for
145 * informational purposes only.
147 * @retval 0 waiting timed out, transcoding is not finished
148 * @retval 1 transcoding is finished
150 int sch_wait(Scheduler
*sch
, uint64_t timeout_us
, int64_t *transcode_ts
);
153 * Add a demuxer to the scheduler.
155 * @param func Function executed as the demuxer task.
156 * @param ctx Demuxer state; will be passed to func and used for logging.
158 * @retval ">=0" Index of the newly-created demuxer.
159 * @retval "<0" Error code.
161 int sch_add_demux(Scheduler
*sch
, SchThreadFunc func
, void *ctx
);
163 * Add a demuxed stream for a previously added demuxer.
165 * @param demux_idx index previously returned by sch_add_demux()
167 * @retval ">=0" Index of the newly-created demuxed stream.
168 * @retval "<0" Error code.
170 int sch_add_demux_stream(Scheduler
*sch
, unsigned demux_idx
);
173 * Add a decoder to the scheduler.
175 * @param func Function executed as the decoder task.
176 * @param ctx Decoder state; will be passed to func and used for logging.
177 * @param send_end_ts The decoder will return an end timestamp after flush packets
178 * are delivered to it. See documentation for
179 * sch_dec_receive() for more details.
181 * @retval ">=0" Index of the newly-created decoder.
182 * @retval "<0" Error code.
184 int sch_add_dec(Scheduler
*sch
, SchThreadFunc func
, void *ctx
, int send_end_ts
);
187 * Add another output to decoder (e.g. for multiview video).
189 * @retval ">=0" Index of the newly-added decoder output.
190 * @retval "<0" Error code.
192 int sch_add_dec_output(Scheduler
*sch
, unsigned dec_idx
);
195 * Add a filtergraph to the scheduler.
197 * @param nb_inputs Number of filtergraph inputs.
198 * @param nb_outputs number of filtergraph outputs
199 * @param func Function executed as the filtering task.
200 * @param ctx Filter state; will be passed to func and used for logging.
202 * @retval ">=0" Index of the newly-created filtergraph.
203 * @retval "<0" Error code.
205 int sch_add_filtergraph(Scheduler
*sch
, unsigned nb_inputs
, unsigned nb_outputs
,
206 SchThreadFunc func
, void *ctx
);
209 * Add a muxer to the scheduler.
211 * Note that muxer thread startup is more complicated than for other components, because:
213 * - muxer streams fed by audio/video encoders become initialized dynamically at
214 * runtime, after those encoders receive their first frame and initialize
215 * themselves, followed by calling sch_mux_stream_ready()
216 * - the header can be written after all the streams for a muxer are initialized
217 * - we may need to write an SDP, which must happen
218 * - AFTER all the headers are written
219 * - BEFORE any packets are written by any muxer
220 * - with all the muxers quiescent
221 * To avoid complicated muxer-thread synchronization dances, we postpone
222 * starting the muxer threads until after the SDP is written. The sequence of
223 * events is then as follows:
224 * - After sch_mux_stream_ready() is called for all the streams in a given muxer,
225 * the header for that muxer is written (care is taken that headers for
226 * different muxers are not written concurrently, since they write file
227 * information to stderr). If SDP is not wanted, the muxer thread then starts
229 * - When SDP _is_ wanted, no muxer threads start until the header for the last
230 * muxer is written. After that, the SDP is written, after which all the muxer
231 * threads are started at once.
233 * In order for the above to work, the scheduler needs to be able to invoke
234 * just writing the header, which is the reason the init parameter exists.
236 * @param func Function executed as the muxing task.
237 * @param init Callback that is called to initialize the muxer and write the
238 * header. Called after sch_mux_stream_ready() is called for all the
239 * streams in the muxer.
240 * @param ctx Muxer state; will be passed to func/init and used for logging.
241 * @param sdp_auto Determines automatic SDP writing - see sch_sdp_filename().
242 * @param thread_queue_size number of packets that can be buffered before
243 * sending to the muxer blocks
245 * @retval ">=0" Index of the newly-created muxer.
246 * @retval "<0" Error code.
248 int sch_add_mux(Scheduler
*sch
, SchThreadFunc func
, int (*init
)(void *),
249 void *ctx
, int sdp_auto
, unsigned thread_queue_size
);
252 * Default size of a packet thread queue. For muxing this can be overridden by
253 * the thread_queue_size option as passed to a call to sch_add_mux().
255 #define DEFAULT_PACKET_THREAD_QUEUE_SIZE 8
258 * Default size of a frame thread queue.
260 #define DEFAULT_FRAME_THREAD_QUEUE_SIZE 8
263 * Add a muxed stream for a previously added muxer.
265 * @param mux_idx index previously returned by sch_add_mux()
267 * @retval ">=0" Index of the newly-created muxed stream.
268 * @retval "<0" Error code.
270 int sch_add_mux_stream(Scheduler
*sch
, unsigned mux_idx
);
273 * Configure limits on packet buffering performed before the muxer task is started.
276 * @param mux_idx index previously returned by sch_add_mux()
277 * @param stream_idx index previously returned by sch_add_mux_stream()
278 * @param data_threshold Total size of the buffered packets' data after which
279 * max_packets applies.
280 * @param max_packets Maximum number of buffered packets after
281 * data_threshold is reached.
283 void sch_mux_stream_buffering(Scheduler
*sch
, unsigned mux_idx
, unsigned stream_idx
,
284 size_t data_threshold
, int max_packets
);
287 * Signal to the scheduler that the specified muxed stream is initialized and
288 * ready. Muxing is started once all the streams are ready.
290 int sch_mux_stream_ready(Scheduler
*sch
, unsigned mux_idx
, unsigned stream_idx
);
293 * Set the file path for the SDP.
295 * The SDP is written when either of the following is true:
296 * - this function is called at least once
297 * - sdp_auto=1 is passed to EVERY call of sch_add_mux()
299 int sch_sdp_filename(Scheduler
*sch
, const char *sdp_filename
);
302 * Add an encoder to the scheduler.
304 * @param func Function executed as the encoding task.
305 * @param ctx Encoder state; will be passed to func and used for logging.
306 * @param open_cb This callback, if specified, will be called when the first
307 * frame is obtained for this encoder. For audio encoders with a
308 * fixed frame size (which use a sync queue in the scheduler to
309 * rechunk frames), it must return that frame size on success.
310 * Otherwise (non-audio, variable frame size) it should return 0.
312 * @retval ">=0" Index of the newly-created encoder.
313 * @retval "<0" Error code.
315 int sch_add_enc(Scheduler
*sch
, SchThreadFunc func
, void *ctx
,
316 int (*open_cb
)(void *func_arg
, const struct AVFrame
*frame
));
319 * Add a pre-encoding sync queue to the scheduler.
321 * @param buf_size_us Sync queue buffering size, passed to sq_alloc().
322 * @param logctx Logging context for the sync queue, passed to sq_alloc().
324 * @retval ">=0" Index of the newly-created sync queue.
325 * @retval "<0" Error code.
327 int sch_add_sq_enc(Scheduler
*sch
, uint64_t buf_size_us
, void *logctx
);
/**
 * Associate an encoder with a pre-encoding sync queue.
 * NOTE(review): undocumented in this header; the parameter descriptions below
 * are inferred from names and must be confirmed against the implementation.
 *
 * @param sq_idx     presumably an index returned by sch_add_sq_enc()
 * @param enc_idx    presumably an index returned by sch_add_enc()
 * @param limiting   presumably a boolean flag forwarded to the sync queue
 * @param max_frames presumably a cap on the number of frames for this encoder
 *
 * @return int status; presumably a negative error code on failure.
 */
328 int sch_sq_add_enc(Scheduler
*sch
, unsigned sq_idx
, unsigned enc_idx
,
329 int limiting
, uint64_t max_frames
);
/**
 * Connect two scheduler nodes.
 *
 * @param src Source node, passed by value.
 * @param dst Destination node, passed by value.
 *
 * NOTE(review): undocumented in this header; presumably src/dst are built
 * with the SCH_*() node macros and only the source/destination pairings
 * described in the architecture overview are accepted - confirm.
 *
 * @return int status; presumably a negative error code on failure.
 */
331 int sch_connect(Scheduler
*sch
, SchedulerNode src
, SchedulerNode dst
);
333 enum DemuxSendFlags
{
335 * Treat the packet as an EOF for SCH_NODE_TYPE_MUX destinations;
336 * send it normally to other destination types.
338 DEMUX_SEND_STREAMCOPY_EOF
= (1 << 0),
342 * Called by demuxer tasks to communicate with their downstreams. The following may be sent:
344 * - a demuxed packet for the stream identified by pkt->stream_index;
345 * - demuxer discontinuity/reset (e.g. after a seek) - this is signalled by an
346 * empty packet with stream_index=-1.
348 * @param demux_idx demuxer index
349 * @param pkt A demuxed packet to send.
350 * When flushing (i.e. pkt->stream_index=-1 on entry to this
351 * function), on successful return pkt->pts/pkt->time_base will be
352 * set to the maximum end timestamp of any decoded audio stream, or
353 * AV_NOPTS_VALUE if no decoded audio streams are present.
355 * @retval "non-negative value" success
356 * @retval AVERROR_EOF all consumers for the stream are done
357 * @retval AVERROR_EXIT all consumers are done, should terminate demuxing
358 * @retval "another negative error code" other failure
360 int sch_demux_send(Scheduler
*sch
, unsigned demux_idx
, struct AVPacket
*pkt
,
364 * Called by decoder tasks to receive a packet for decoding.
366 * @param dec_idx decoder index
367 * @param pkt Input packet will be written here on success.
369 * An empty packet signals that the decoder should be flushed, but
370 * more packets will follow (e.g. after seeking). When a decoder
371 * created with send_end_ts=1 receives a flush packet, it must write
372 * the end timestamp of the stream after flushing to
373 * pkt->pts/time_base on the next call to this function (if any).
375 * @retval "non-negative value" success
376 * @retval AVERROR_EOF no more packets will arrive, should terminate decoding
377 * @retval "another negative error code" other failure
379 int sch_dec_receive(Scheduler
*sch
, unsigned dec_idx
, struct AVPacket
*pkt
);
382 * Called by decoder tasks to send a decoded frame downstream.
384 * @param dec_idx Decoder index previously returned by sch_add_dec().
385 * @param frame Decoded frame; on success it is consumed and cleared by this function.
388 * @retval ">=0" success
389 * @retval AVERROR_EOF all consumers are done, should terminate decoding
390 * @retval "another negative error code" other failure
392 int sch_dec_send(Scheduler
*sch
, unsigned dec_idx
,
393 unsigned out_idx
, struct AVFrame
*frame
);
396 * Called by filtergraph tasks to obtain frames for filtering. Will wait for a
397 * frame to become available and return it in frame.
399 * Filtergraphs that contain lavfi sources and do not currently require new
400 * input frames should call this function as a means of rate control - then
401 * in_idx should be set equal to nb_inputs on entry to this function.
403 * @param fg_idx Filtergraph index previously returned by sch_add_filtergraph().
404 * @param[in,out] in_idx On input contains the index of the input on which a frame
405 * is most desired. May be set to nb_inputs to signal that
406 * the filtergraph does not need more input currently.
408 * On success, will be replaced with the input index of
409 * the actually returned frame or EOF timestamp.
411 * @retval ">=0" Frame data or EOF timestamp was delivered into frame, in_idx
412 * contains the index of the input it belongs to.
413 * @retval AVERROR(EAGAIN) No frame was returned, the filtergraph should
414 * resume filtering. May only be returned when
415 * in_idx=nb_inputs on entry to this function.
416 * @retval AVERROR_EOF No more frames will arrive, should terminate filtering.
418 int sch_filter_receive(Scheduler
*sch
, unsigned fg_idx
,
419 unsigned *in_idx
, struct AVFrame
*frame
);
421 * Called by filter tasks to signal that a filter input will no longer accept input.
423 * @param fg_idx Filtergraph index previously returned from sch_add_filtergraph().
424 * @param in_idx Index of the input to finish.
426 void sch_filter_receive_finish(Scheduler
*sch
, unsigned fg_idx
, unsigned in_idx
);
429 * Called by filtergraph tasks to send a filtered frame or EOF to consumers.
431 * @param fg_idx Filtergraph index previously returned by sch_add_filtergraph().
432 * @param out_idx Index of the output which produced the frame.
433 * @param frame The frame to send to consumers. When NULL, signals that no more
434 * frames will be produced for the specified output. When non-NULL,
435 * the frame is consumed and cleared by this function on success.
437 * @retval "non-negative value" success
438 * @retval AVERROR_EOF all consumers are done
439 * @retval "another negative error code" other failure
441 int sch_filter_send(Scheduler
*sch
, unsigned fg_idx
, unsigned out_idx
,
442 struct AVFrame
*frame
);
/**
 * NOTE(review): undocumented in this header. Takes a filtergraph index and a
 * frame; presumably delivers a command (carried by frame) to the filtergraph
 * task identified by fg_idx - confirm against the implementation, including
 * whether frame is consumed.
 *
 * @param fg_idx presumably an index returned by sch_add_filtergraph()
 * @return int status; presumably a negative error code on failure.
 */
444 int sch_filter_command(Scheduler
*sch
, unsigned fg_idx
, struct AVFrame
*frame
);
447 * Called by encoder tasks to obtain frames for encoding. Will wait for a frame
448 * to become available and return it in frame.
450 * @param enc_idx Encoder index previously returned by sch_add_enc().
451 * @param frame Newly-received frame will be stored here on success. Must be
452 * clean on entrance to this function.
454 * @retval 0 A frame was successfully delivered into frame.
455 * @retval AVERROR_EOF No more frames will be delivered, the encoder should
456 * flush everything and terminate.
459 int sch_enc_receive(Scheduler
*sch
, unsigned enc_idx
, struct AVFrame
*frame
);
462 * Called by encoder tasks to send encoded packets downstream.
464 * @param enc_idx Encoder index previously returned by sch_add_enc().
465 * @param pkt An encoded packet; it will be consumed and cleared by this
466 * function on success.
469 * @retval "<0" Error code.
471 int sch_enc_send (Scheduler
*sch
, unsigned enc_idx
, struct AVPacket
*pkt
);
474 * Called by muxer tasks to obtain packets for muxing. Will wait for a packet
475 * for any muxed stream to become available and return it in pkt.
477 * @param mux_idx Muxer index previously returned by sch_add_mux().
478 * @param pkt Newly-received packet will be stored here on success. Must be
479 * clean on entrance to this function.
481 * @retval 0 A packet was successfully delivered into pkt. Its stream_index
482 * corresponds to a stream index previously returned from
483 * sch_add_mux_stream().
484 * @retval AVERROR_EOF When pkt->stream_index is non-negative, this signals that
485 * no more packets will be delivered for this stream index.
486 * Otherwise this indicates that no more packets will be
487 * delivered for any stream and the muxer should therefore
488 * flush everything and terminate.
490 int sch_mux_receive(Scheduler
*sch
, unsigned mux_idx
, struct AVPacket
*pkt
);
493 * Called by muxer tasks to signal that a stream will no longer accept input.
495 * @param stream_idx Stream index previously returned from sch_add_mux_stream().
497 void sch_mux_receive_finish(Scheduler
*sch
, unsigned mux_idx
, unsigned stream_idx
);
499 int sch_mux_sub_heartbeat_add(Scheduler
*sch
, unsigned mux_idx
, unsigned stream_idx
,
/**
 * NOTE(review): undocumented in this header. Takes a muxer index, a muxed
 * stream index and a read-only packet; the exact semantics must be confirmed
 * against the implementation.
 *
 * Unlike the other prototypes here, which spell the type as
 * "struct AVPacket", this one uses the bare AVPacket name, so the AVPacket
 * typedef must already be visible where this header is included.
 *
 * @param mux_idx    presumably an index returned by sch_add_mux()
 * @param stream_idx presumably an index returned by sch_add_mux_stream()
 * @param pkt        packet to inspect; not modified (const)
 * @return int status; presumably a negative error code on failure.
 */
501 int sch_mux_sub_heartbeat(Scheduler
*sch
, unsigned mux_idx
, unsigned stream_idx
,
502 const AVPacket
*pkt
);
504 #endif /* FFTOOLS_FFMPEG_SCHED_H */