ffmpeg / libavcodec / pthread.c @ 05fa64a7
History | View | Annotate | Download (27.2 KB)
1 |
/*
|
---|---|
2 |
* Copyright (c) 2004 Roman Shaposhnik
|
3 |
* Copyright (c) 2008 Alexander Strange (astrange@ithinksw.com)
|
4 |
*
|
5 |
* Many thanks to Steven M. Schultz for providing clever ideas and
|
6 |
* to Michael Niedermayer <michaelni@gmx.at> for writing initial
|
7 |
* implementation.
|
8 |
*
|
9 |
* This file is part of FFmpeg.
|
10 |
*
|
11 |
* FFmpeg is free software; you can redistribute it and/or
|
12 |
* modify it under the terms of the GNU Lesser General Public
|
13 |
* License as published by the Free Software Foundation; either
|
14 |
* version 2.1 of the License, or (at your option) any later version.
|
15 |
*
|
16 |
* FFmpeg is distributed in the hope that it will be useful,
|
17 |
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
18 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
19 |
* Lesser General Public License for more details.
|
20 |
*
|
21 |
* You should have received a copy of the GNU Lesser General Public
|
22 |
* License along with FFmpeg; if not, write to the Free Software
|
23 |
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
24 |
*/
|
25 |
|
26 |
/**
|
27 |
* @file
|
28 |
* Multithreading support functions
|
29 |
* @see doc/multithreading.txt
|
30 |
*/
|
31 |
|
32 |
#include <pthread.h> |
33 |
|
34 |
#include "avcodec.h" |
35 |
#include "thread.h" |
36 |
|
37 |
typedef int (action_func)(AVCodecContext *c, void *arg); |
38 |
typedef int (action_func2)(AVCodecContext *c, void *arg, int jobnr, int threadnr); |
39 |
|
40 |
typedef struct ThreadContext { |
41 |
pthread_t *workers; |
42 |
action_func *func; |
43 |
action_func2 *func2; |
44 |
void *args;
|
45 |
int *rets;
|
46 |
int rets_count;
|
47 |
int job_count;
|
48 |
int job_size;
|
49 |
|
50 |
pthread_cond_t last_job_cond; |
51 |
pthread_cond_t current_job_cond; |
52 |
pthread_mutex_t current_job_lock; |
53 |
int current_job;
|
54 |
int done;
|
55 |
} ThreadContext; |
56 |
|
57 |
/// Max number of frame buffers that can be allocated when using frame threads.
|
58 |
#define MAX_BUFFERS 32 |
59 |
|
60 |
/**
|
61 |
* Context used by codec threads and stored in their AVCodecContext thread_opaque.
|
62 |
*/
|
63 |
typedef struct PerThreadContext { |
64 |
struct FrameThreadContext *parent;
|
65 |
|
66 |
pthread_t thread; |
67 |
pthread_cond_t input_cond; ///< Used to wait for a new packet from the main thread.
|
68 |
pthread_cond_t progress_cond; ///< Used by child threads to wait for progress to change.
|
69 |
pthread_cond_t output_cond; ///< Used by the main thread to wait for frames to finish.
|
70 |
|
71 |
pthread_mutex_t mutex; ///< Mutex used to protect the contents of the PerThreadContext.
|
72 |
pthread_mutex_t progress_mutex; ///< Mutex used to protect frame progress values and progress_cond.
|
73 |
|
74 |
AVCodecContext *avctx; ///< Context used to decode packets passed to this thread.
|
75 |
|
76 |
AVPacket avpkt; ///< Input packet (for decoding) or output (for encoding).
|
77 |
int allocated_buf_size; ///< Size allocated for avpkt.data |
78 |
|
79 |
AVFrame frame; ///< Output frame (for decoding) or input (for encoding).
|
80 |
int got_frame; ///< The output of got_picture_ptr from the last avcodec_decode_video() call. |
81 |
int result; ///< The result of the last codec decode/encode() call. |
82 |
|
83 |
enum {
|
84 |
STATE_INPUT_READY, ///< Set when the thread is awaiting a packet.
|
85 |
STATE_SETTING_UP, ///< Set before the codec has called ff_thread_finish_setup().
|
86 |
STATE_GET_BUFFER, /**<
|
87 |
* Set when the codec calls get_buffer().
|
88 |
* State is returned to STATE_SETTING_UP afterwards.
|
89 |
*/
|
90 |
STATE_SETUP_FINISHED ///< Set after the codec has called ff_thread_finish_setup().
|
91 |
} state; |
92 |
|
93 |
/**
|
94 |
* Array of frames passed to ff_thread_release_buffer().
|
95 |
* Frames are released after all threads referencing them are finished.
|
96 |
*/
|
97 |
AVFrame released_buffers[MAX_BUFFERS]; |
98 |
int num_released_buffers;
|
99 |
|
100 |
/**
|
101 |
* Array of progress values used by ff_thread_get_buffer().
|
102 |
*/
|
103 |
int progress[MAX_BUFFERS][2]; |
104 |
uint8_t progress_used[MAX_BUFFERS]; |
105 |
|
106 |
AVFrame *requested_frame; ///< AVFrame the codec passed to get_buffer()
|
107 |
} PerThreadContext; |
108 |
|
109 |
/**
|
110 |
* Context stored in the client AVCodecContext thread_opaque.
|
111 |
*/
|
112 |
typedef struct FrameThreadContext { |
113 |
PerThreadContext *threads; ///< The contexts for each thread.
|
114 |
PerThreadContext *prev_thread; ///< The last thread submit_packet() was called on.
|
115 |
|
116 |
pthread_mutex_t buffer_mutex; ///< Mutex used to protect get/release_buffer().
|
117 |
|
118 |
int next_decoding; ///< The next context to submit a packet to. |
119 |
int next_finished; ///< The next context to return output from. |
120 |
|
121 |
int delaying; /**< |
122 |
* Set for the first N packets, where N is the number of threads.
|
123 |
* While it is set, ff_thread_en/decode_frame won't return any results.
|
124 |
*/
|
125 |
|
126 |
int die; ///< Set when threads should exit. |
127 |
} FrameThreadContext; |
128 |
|
129 |
static void* attribute_align_arg worker(void *v) |
130 |
{ |
131 |
AVCodecContext *avctx = v; |
132 |
ThreadContext *c = avctx->thread_opaque; |
133 |
int our_job = c->job_count;
|
134 |
int thread_count = avctx->thread_count;
|
135 |
int self_id;
|
136 |
|
137 |
pthread_mutex_lock(&c->current_job_lock); |
138 |
self_id = c->current_job++; |
139 |
for (;;){
|
140 |
while (our_job >= c->job_count) {
|
141 |
if (c->current_job == thread_count + c->job_count)
|
142 |
pthread_cond_signal(&c->last_job_cond); |
143 |
|
144 |
pthread_cond_wait(&c->current_job_cond, &c->current_job_lock); |
145 |
our_job = self_id; |
146 |
|
147 |
if (c->done) {
|
148 |
pthread_mutex_unlock(&c->current_job_lock); |
149 |
return NULL; |
150 |
} |
151 |
} |
152 |
pthread_mutex_unlock(&c->current_job_lock); |
153 |
|
154 |
c->rets[our_job%c->rets_count] = c->func ? c->func(avctx, (char*)c->args + our_job*c->job_size):
|
155 |
c->func2(avctx, c->args, our_job, self_id); |
156 |
|
157 |
pthread_mutex_lock(&c->current_job_lock); |
158 |
our_job = c->current_job++; |
159 |
} |
160 |
} |
161 |
|
162 |
static av_always_inline void avcodec_thread_park_workers(ThreadContext *c, int thread_count) |
163 |
{ |
164 |
pthread_cond_wait(&c->last_job_cond, &c->current_job_lock); |
165 |
pthread_mutex_unlock(&c->current_job_lock); |
166 |
} |
167 |
|
168 |
static void thread_free(AVCodecContext *avctx) |
169 |
{ |
170 |
ThreadContext *c = avctx->thread_opaque; |
171 |
int i;
|
172 |
|
173 |
pthread_mutex_lock(&c->current_job_lock); |
174 |
c->done = 1;
|
175 |
pthread_cond_broadcast(&c->current_job_cond); |
176 |
pthread_mutex_unlock(&c->current_job_lock); |
177 |
|
178 |
for (i=0; i<avctx->thread_count; i++) |
179 |
pthread_join(c->workers[i], NULL);
|
180 |
|
181 |
pthread_mutex_destroy(&c->current_job_lock); |
182 |
pthread_cond_destroy(&c->current_job_cond); |
183 |
pthread_cond_destroy(&c->last_job_cond); |
184 |
av_free(c->workers); |
185 |
av_freep(&avctx->thread_opaque); |
186 |
} |
187 |
|
188 |
static int avcodec_thread_execute(AVCodecContext *avctx, action_func* func, void *arg, int *ret, int job_count, int job_size) |
189 |
{ |
190 |
ThreadContext *c= avctx->thread_opaque; |
191 |
int dummy_ret;
|
192 |
|
193 |
if (!(avctx->active_thread_type&FF_THREAD_SLICE) || avctx->thread_count <= 1) |
194 |
return avcodec_default_execute(avctx, func, arg, ret, job_count, job_size);
|
195 |
|
196 |
if (job_count <= 0) |
197 |
return 0; |
198 |
|
199 |
pthread_mutex_lock(&c->current_job_lock); |
200 |
|
201 |
c->current_job = avctx->thread_count; |
202 |
c->job_count = job_count; |
203 |
c->job_size = job_size; |
204 |
c->args = arg; |
205 |
c->func = func; |
206 |
if (ret) {
|
207 |
c->rets = ret; |
208 |
c->rets_count = job_count; |
209 |
} else {
|
210 |
c->rets = &dummy_ret; |
211 |
c->rets_count = 1;
|
212 |
} |
213 |
pthread_cond_broadcast(&c->current_job_cond); |
214 |
|
215 |
avcodec_thread_park_workers(c, avctx->thread_count); |
216 |
|
217 |
return 0; |
218 |
} |
219 |
|
220 |
static int avcodec_thread_execute2(AVCodecContext *avctx, action_func2* func2, void *arg, int *ret, int job_count) |
221 |
{ |
222 |
ThreadContext *c= avctx->thread_opaque; |
223 |
c->func2 = func2; |
224 |
return avcodec_thread_execute(avctx, NULL, arg, ret, job_count, 0); |
225 |
} |
226 |
|
227 |
static int thread_init(AVCodecContext *avctx) |
228 |
{ |
229 |
int i;
|
230 |
ThreadContext *c; |
231 |
int thread_count = avctx->thread_count;
|
232 |
|
233 |
if (thread_count <= 1) |
234 |
return 0; |
235 |
|
236 |
c = av_mallocz(sizeof(ThreadContext));
|
237 |
if (!c)
|
238 |
return -1; |
239 |
|
240 |
c->workers = av_mallocz(sizeof(pthread_t)*thread_count);
|
241 |
if (!c->workers) {
|
242 |
av_free(c); |
243 |
return -1; |
244 |
} |
245 |
|
246 |
avctx->thread_opaque = c; |
247 |
c->current_job = 0;
|
248 |
c->job_count = 0;
|
249 |
c->job_size = 0;
|
250 |
c->done = 0;
|
251 |
pthread_cond_init(&c->current_job_cond, NULL);
|
252 |
pthread_cond_init(&c->last_job_cond, NULL);
|
253 |
pthread_mutex_init(&c->current_job_lock, NULL);
|
254 |
pthread_mutex_lock(&c->current_job_lock); |
255 |
for (i=0; i<thread_count; i++) { |
256 |
if(pthread_create(&c->workers[i], NULL, worker, avctx)) { |
257 |
avctx->thread_count = i; |
258 |
pthread_mutex_unlock(&c->current_job_lock); |
259 |
ff_thread_free(avctx); |
260 |
return -1; |
261 |
} |
262 |
} |
263 |
|
264 |
avcodec_thread_park_workers(c, thread_count); |
265 |
|
266 |
avctx->execute = avcodec_thread_execute; |
267 |
avctx->execute2 = avcodec_thread_execute2; |
268 |
return 0; |
269 |
} |
270 |
|
271 |
/**
|
272 |
* Codec worker thread.
|
273 |
*
|
274 |
* Automatically calls ff_thread_finish_setup() if the codec does
|
275 |
* not provide an update_thread_context method, or if the codec returns
|
276 |
* before calling it.
|
277 |
*/
|
278 |
static attribute_align_arg void *frame_worker_thread(void *arg) |
279 |
{ |
280 |
PerThreadContext *p = arg; |
281 |
FrameThreadContext *fctx = p->parent; |
282 |
AVCodecContext *avctx = p->avctx; |
283 |
AVCodec *codec = avctx->codec; |
284 |
|
285 |
while (1) { |
286 |
if (p->state == STATE_INPUT_READY && !fctx->die) {
|
287 |
pthread_mutex_lock(&p->mutex); |
288 |
while (p->state == STATE_INPUT_READY && !fctx->die)
|
289 |
pthread_cond_wait(&p->input_cond, &p->mutex); |
290 |
pthread_mutex_unlock(&p->mutex); |
291 |
} |
292 |
|
293 |
if (fctx->die) break; |
294 |
|
295 |
if (!codec->update_thread_context && avctx->thread_safe_callbacks)
|
296 |
ff_thread_finish_setup(avctx); |
297 |
|
298 |
pthread_mutex_lock(&p->mutex); |
299 |
avcodec_get_frame_defaults(&p->frame); |
300 |
p->got_frame = 0;
|
301 |
p->result = codec->decode(avctx, &p->frame, &p->got_frame, &p->avpkt); |
302 |
|
303 |
if (p->state == STATE_SETTING_UP) ff_thread_finish_setup(avctx);
|
304 |
|
305 |
p->state = STATE_INPUT_READY; |
306 |
|
307 |
pthread_mutex_lock(&p->progress_mutex); |
308 |
pthread_cond_signal(&p->output_cond); |
309 |
pthread_mutex_unlock(&p->progress_mutex); |
310 |
|
311 |
pthread_mutex_unlock(&p->mutex); |
312 |
} |
313 |
|
314 |
return NULL; |
315 |
} |
316 |
|
317 |
/**
|
318 |
* Updates the next thread's AVCodecContext with values from the reference thread's context.
|
319 |
*
|
320 |
* @param dst The destination context.
|
321 |
* @param src The source context.
|
322 |
* @param for_user 0 if the destination is a codec thread, 1 if the destination is the user's thread
|
323 |
*/
|
324 |
static int update_context_from_thread(AVCodecContext *dst, AVCodecContext *src, int for_user) |
325 |
{ |
326 |
int err = 0; |
327 |
|
328 |
if (dst != src) {
|
329 |
dst->sub_id = src->sub_id; |
330 |
dst->time_base = src->time_base; |
331 |
dst->width = src->width; |
332 |
dst->height = src->height; |
333 |
dst->pix_fmt = src->pix_fmt; |
334 |
|
335 |
dst->has_b_frames = src->has_b_frames; |
336 |
dst->idct_algo = src->idct_algo; |
337 |
dst->slice_count = src->slice_count; |
338 |
|
339 |
dst->bits_per_coded_sample = src->bits_per_coded_sample; |
340 |
dst->sample_aspect_ratio = src->sample_aspect_ratio; |
341 |
dst->dtg_active_format = src->dtg_active_format; |
342 |
|
343 |
dst->profile = src->profile; |
344 |
dst->level = src->level; |
345 |
|
346 |
dst->bits_per_raw_sample = src->bits_per_raw_sample; |
347 |
dst->ticks_per_frame = src->ticks_per_frame; |
348 |
dst->color_primaries = src->color_primaries; |
349 |
|
350 |
dst->color_trc = src->color_trc; |
351 |
dst->colorspace = src->colorspace; |
352 |
dst->color_range = src->color_range; |
353 |
dst->chroma_sample_location = src->chroma_sample_location; |
354 |
} |
355 |
|
356 |
if (for_user) {
|
357 |
dst->coded_frame = src->coded_frame; |
358 |
dst->has_b_frames += src->thread_count - 1;
|
359 |
} else {
|
360 |
if (dst->codec->update_thread_context)
|
361 |
err = dst->codec->update_thread_context(dst, src); |
362 |
} |
363 |
|
364 |
return err;
|
365 |
} |
366 |
|
367 |
/**
|
368 |
* Update the next thread's AVCodecContext with values set by the user.
|
369 |
*
|
370 |
* @param dst The destination context.
|
371 |
* @param src The source context.
|
372 |
*/
|
373 |
static void update_context_from_user(AVCodecContext *dst, AVCodecContext *src) |
374 |
{ |
375 |
#define copy_fields(s, e) memcpy(&dst->s, &src->s, (char*)&dst->e - (char*)&dst->s); |
376 |
dst->flags = src->flags; |
377 |
|
378 |
dst->draw_horiz_band= src->draw_horiz_band; |
379 |
dst->get_buffer = src->get_buffer; |
380 |
dst->release_buffer = src->release_buffer; |
381 |
|
382 |
dst->opaque = src->opaque; |
383 |
dst->hurry_up = src->hurry_up; |
384 |
dst->dsp_mask = src->dsp_mask; |
385 |
dst->debug = src->debug; |
386 |
dst->debug_mv = src->debug_mv; |
387 |
|
388 |
dst->slice_flags = src->slice_flags; |
389 |
dst->flags2 = src->flags2; |
390 |
|
391 |
copy_fields(skip_loop_filter, bidir_refine); |
392 |
|
393 |
dst->frame_number = src->frame_number; |
394 |
dst->reordered_opaque = src->reordered_opaque; |
395 |
#undef copy_fields
|
396 |
} |
397 |
|
398 |
static void free_progress(AVFrame *f) |
399 |
{ |
400 |
PerThreadContext *p = f->owner->thread_opaque; |
401 |
int *progress = f->thread_opaque;
|
402 |
|
403 |
p->progress_used[(progress - p->progress[0]) / 2] = 0; |
404 |
} |
405 |
|
406 |
/// Releases the buffers that this decoding thread was the last user of.
|
407 |
static void release_delayed_buffers(PerThreadContext *p) |
408 |
{ |
409 |
FrameThreadContext *fctx = p->parent; |
410 |
|
411 |
while (p->num_released_buffers > 0) { |
412 |
AVFrame *f = &p->released_buffers[--p->num_released_buffers]; |
413 |
|
414 |
pthread_mutex_lock(&fctx->buffer_mutex); |
415 |
free_progress(f); |
416 |
f->thread_opaque = NULL;
|
417 |
|
418 |
f->owner->release_buffer(f->owner, f); |
419 |
pthread_mutex_unlock(&fctx->buffer_mutex); |
420 |
} |
421 |
} |
422 |
|
423 |
static int submit_packet(PerThreadContext *p, AVPacket *avpkt) |
424 |
{ |
425 |
FrameThreadContext *fctx = p->parent; |
426 |
PerThreadContext *prev_thread = fctx->prev_thread; |
427 |
AVCodec *codec = p->avctx->codec; |
428 |
uint8_t *buf = p->avpkt.data; |
429 |
|
430 |
if (!avpkt->size && !(codec->capabilities & CODEC_CAP_DELAY)) return 0; |
431 |
|
432 |
pthread_mutex_lock(&p->mutex); |
433 |
|
434 |
release_delayed_buffers(p); |
435 |
|
436 |
if (prev_thread) {
|
437 |
int err;
|
438 |
if (prev_thread->state == STATE_SETTING_UP) {
|
439 |
pthread_mutex_lock(&prev_thread->progress_mutex); |
440 |
while (prev_thread->state == STATE_SETTING_UP)
|
441 |
pthread_cond_wait(&prev_thread->progress_cond, &prev_thread->progress_mutex); |
442 |
pthread_mutex_unlock(&prev_thread->progress_mutex); |
443 |
} |
444 |
|
445 |
err = update_context_from_thread(p->avctx, prev_thread->avctx, 0);
|
446 |
if (err) {
|
447 |
pthread_mutex_unlock(&p->mutex); |
448 |
return err;
|
449 |
} |
450 |
} |
451 |
|
452 |
av_fast_malloc(&buf, &p->allocated_buf_size, avpkt->size + FF_INPUT_BUFFER_PADDING_SIZE); |
453 |
p->avpkt = *avpkt; |
454 |
p->avpkt.data = buf; |
455 |
memcpy(buf, avpkt->data, avpkt->size); |
456 |
memset(buf + avpkt->size, 0, FF_INPUT_BUFFER_PADDING_SIZE);
|
457 |
|
458 |
p->state = STATE_SETTING_UP; |
459 |
pthread_cond_signal(&p->input_cond); |
460 |
pthread_mutex_unlock(&p->mutex); |
461 |
|
462 |
/*
|
463 |
* If the client doesn't have a thread-safe get_buffer(),
|
464 |
* then decoding threads call back to the main thread,
|
465 |
* and it calls back to the client here.
|
466 |
*/
|
467 |
|
468 |
if (!p->avctx->thread_safe_callbacks &&
|
469 |
p->avctx->get_buffer != avcodec_default_get_buffer) { |
470 |
while (p->state != STATE_SETUP_FINISHED && p->state != STATE_INPUT_READY) {
|
471 |
pthread_mutex_lock(&p->progress_mutex); |
472 |
while (p->state == STATE_SETTING_UP)
|
473 |
pthread_cond_wait(&p->progress_cond, &p->progress_mutex); |
474 |
|
475 |
if (p->state == STATE_GET_BUFFER) {
|
476 |
p->result = p->avctx->get_buffer(p->avctx, p->requested_frame); |
477 |
p->state = STATE_SETTING_UP; |
478 |
pthread_cond_signal(&p->progress_cond); |
479 |
} |
480 |
pthread_mutex_unlock(&p->progress_mutex); |
481 |
} |
482 |
} |
483 |
|
484 |
fctx->prev_thread = p; |
485 |
|
486 |
return 0; |
487 |
} |
488 |
|
489 |
int ff_thread_decode_frame(AVCodecContext *avctx,
|
490 |
AVFrame *picture, int *got_picture_ptr,
|
491 |
AVPacket *avpkt) |
492 |
{ |
493 |
FrameThreadContext *fctx = avctx->thread_opaque; |
494 |
int finished = fctx->next_finished;
|
495 |
PerThreadContext *p; |
496 |
int err;
|
497 |
|
498 |
/*
|
499 |
* Submit a packet to the next decoding thread.
|
500 |
*/
|
501 |
|
502 |
p = &fctx->threads[fctx->next_decoding]; |
503 |
update_context_from_user(p->avctx, avctx); |
504 |
err = submit_packet(p, avpkt); |
505 |
if (err) return err; |
506 |
|
507 |
fctx->next_decoding++; |
508 |
|
509 |
/*
|
510 |
* If we're still receiving the initial packets, don't return a frame.
|
511 |
*/
|
512 |
|
513 |
if (fctx->delaying && avpkt->size) {
|
514 |
if (fctx->next_decoding >= (avctx->thread_count-1)) fctx->delaying = 0; |
515 |
|
516 |
*got_picture_ptr=0;
|
517 |
return 0; |
518 |
} |
519 |
|
520 |
/*
|
521 |
* Return the next available frame from the oldest thread.
|
522 |
* If we're at the end of the stream, then we have to skip threads that
|
523 |
* didn't output a frame, because we don't want to accidentally signal
|
524 |
* EOF (avpkt->size == 0 && *got_picture_ptr == 0).
|
525 |
*/
|
526 |
|
527 |
do {
|
528 |
p = &fctx->threads[finished++]; |
529 |
|
530 |
if (p->state != STATE_INPUT_READY) {
|
531 |
pthread_mutex_lock(&p->progress_mutex); |
532 |
while (p->state != STATE_INPUT_READY)
|
533 |
pthread_cond_wait(&p->output_cond, &p->progress_mutex); |
534 |
pthread_mutex_unlock(&p->progress_mutex); |
535 |
} |
536 |
|
537 |
*picture = p->frame; |
538 |
*got_picture_ptr = p->got_frame; |
539 |
picture->pkt_dts = p->avpkt.dts; |
540 |
|
541 |
/*
|
542 |
* A later call with avkpt->size == 0 may loop over all threads,
|
543 |
* including this one, searching for a frame to return before being
|
544 |
* stopped by the "finished != fctx->next_finished" condition.
|
545 |
* Make sure we don't mistakenly return the same frame again.
|
546 |
*/
|
547 |
p->got_frame = 0;
|
548 |
|
549 |
if (finished >= avctx->thread_count) finished = 0; |
550 |
} while (!avpkt->size && !*got_picture_ptr && finished != fctx->next_finished);
|
551 |
|
552 |
update_context_from_thread(avctx, p->avctx, 1);
|
553 |
|
554 |
if (fctx->next_decoding >= avctx->thread_count) fctx->next_decoding = 0; |
555 |
|
556 |
fctx->next_finished = finished; |
557 |
|
558 |
return p->result;
|
559 |
} |
560 |
|
561 |
void ff_thread_report_progress(AVFrame *f, int n, int field) |
562 |
{ |
563 |
PerThreadContext *p; |
564 |
int *progress = f->thread_opaque;
|
565 |
|
566 |
if (!progress || progress[field] >= n) return; |
567 |
|
568 |
p = f->owner->thread_opaque; |
569 |
|
570 |
if (f->owner->debug&FF_DEBUG_THREADS)
|
571 |
av_log(f->owner, AV_LOG_DEBUG, "%p finished %d field %d\n", progress, n, field);
|
572 |
|
573 |
pthread_mutex_lock(&p->progress_mutex); |
574 |
progress[field] = n; |
575 |
pthread_cond_broadcast(&p->progress_cond); |
576 |
pthread_mutex_unlock(&p->progress_mutex); |
577 |
} |
578 |
|
579 |
void ff_thread_await_progress(AVFrame *f, int n, int field) |
580 |
{ |
581 |
PerThreadContext *p; |
582 |
int *progress = f->thread_opaque;
|
583 |
|
584 |
if (!progress || progress[field] >= n) return; |
585 |
|
586 |
p = f->owner->thread_opaque; |
587 |
|
588 |
if (f->owner->debug&FF_DEBUG_THREADS)
|
589 |
av_log(f->owner, AV_LOG_DEBUG, "thread awaiting %d field %d from %p\n", n, field, progress);
|
590 |
|
591 |
pthread_mutex_lock(&p->progress_mutex); |
592 |
while (progress[field] < n)
|
593 |
pthread_cond_wait(&p->progress_cond, &p->progress_mutex); |
594 |
pthread_mutex_unlock(&p->progress_mutex); |
595 |
} |
596 |
|
597 |
void ff_thread_finish_setup(AVCodecContext *avctx) {
|
598 |
PerThreadContext *p = avctx->thread_opaque; |
599 |
|
600 |
if (!(avctx->active_thread_type&FF_THREAD_FRAME)) return; |
601 |
|
602 |
pthread_mutex_lock(&p->progress_mutex); |
603 |
p->state = STATE_SETUP_FINISHED; |
604 |
pthread_cond_broadcast(&p->progress_cond); |
605 |
pthread_mutex_unlock(&p->progress_mutex); |
606 |
} |
607 |
|
608 |
/// Waits for all threads to finish.
|
609 |
static void park_frame_worker_threads(FrameThreadContext *fctx, int thread_count) |
610 |
{ |
611 |
int i;
|
612 |
|
613 |
for (i = 0; i < thread_count; i++) { |
614 |
PerThreadContext *p = &fctx->threads[i]; |
615 |
|
616 |
if (p->state != STATE_INPUT_READY) {
|
617 |
pthread_mutex_lock(&p->progress_mutex); |
618 |
while (p->state != STATE_INPUT_READY)
|
619 |
pthread_cond_wait(&p->output_cond, &p->progress_mutex); |
620 |
pthread_mutex_unlock(&p->progress_mutex); |
621 |
} |
622 |
} |
623 |
} |
624 |
|
625 |
static void frame_thread_free(AVCodecContext *avctx, int thread_count) |
626 |
{ |
627 |
FrameThreadContext *fctx = avctx->thread_opaque; |
628 |
AVCodec *codec = avctx->codec; |
629 |
int i;
|
630 |
|
631 |
park_frame_worker_threads(fctx, thread_count); |
632 |
|
633 |
if (fctx->prev_thread)
|
634 |
update_context_from_thread(fctx->threads->avctx, fctx->prev_thread->avctx, 0);
|
635 |
|
636 |
fctx->die = 1;
|
637 |
|
638 |
for (i = 0; i < thread_count; i++) { |
639 |
PerThreadContext *p = &fctx->threads[i]; |
640 |
|
641 |
pthread_mutex_lock(&p->mutex); |
642 |
pthread_cond_signal(&p->input_cond); |
643 |
pthread_mutex_unlock(&p->mutex); |
644 |
|
645 |
pthread_join(p->thread, NULL);
|
646 |
|
647 |
if (codec->close)
|
648 |
codec->close(p->avctx); |
649 |
|
650 |
avctx->codec = NULL;
|
651 |
|
652 |
release_delayed_buffers(p); |
653 |
} |
654 |
|
655 |
for (i = 0; i < thread_count; i++) { |
656 |
PerThreadContext *p = &fctx->threads[i]; |
657 |
|
658 |
avcodec_default_free_buffers(p->avctx); |
659 |
|
660 |
pthread_mutex_destroy(&p->mutex); |
661 |
pthread_mutex_destroy(&p->progress_mutex); |
662 |
pthread_cond_destroy(&p->input_cond); |
663 |
pthread_cond_destroy(&p->progress_cond); |
664 |
pthread_cond_destroy(&p->output_cond); |
665 |
av_freep(&p->avpkt.data); |
666 |
|
667 |
if (i)
|
668 |
av_freep(&p->avctx->priv_data); |
669 |
|
670 |
av_freep(&p->avctx); |
671 |
} |
672 |
|
673 |
av_freep(&fctx->threads); |
674 |
pthread_mutex_destroy(&fctx->buffer_mutex); |
675 |
av_freep(&avctx->thread_opaque); |
676 |
} |
677 |
|
678 |
static int frame_thread_init(AVCodecContext *avctx) |
679 |
{ |
680 |
int thread_count = avctx->thread_count;
|
681 |
AVCodec *codec = avctx->codec; |
682 |
AVCodecContext *src = avctx; |
683 |
FrameThreadContext *fctx; |
684 |
int i, err = 0; |
685 |
|
686 |
avctx->thread_opaque = fctx = av_mallocz(sizeof(FrameThreadContext));
|
687 |
|
688 |
fctx->threads = av_mallocz(sizeof(PerThreadContext) * thread_count);
|
689 |
pthread_mutex_init(&fctx->buffer_mutex, NULL);
|
690 |
fctx->delaying = 1;
|
691 |
|
692 |
for (i = 0; i < thread_count; i++) { |
693 |
AVCodecContext *copy = av_malloc(sizeof(AVCodecContext));
|
694 |
PerThreadContext *p = &fctx->threads[i]; |
695 |
|
696 |
pthread_mutex_init(&p->mutex, NULL);
|
697 |
pthread_mutex_init(&p->progress_mutex, NULL);
|
698 |
pthread_cond_init(&p->input_cond, NULL);
|
699 |
pthread_cond_init(&p->progress_cond, NULL);
|
700 |
pthread_cond_init(&p->output_cond, NULL);
|
701 |
|
702 |
p->parent = fctx; |
703 |
p->avctx = copy; |
704 |
|
705 |
*copy = *src; |
706 |
copy->thread_opaque = p; |
707 |
copy->pkt = &p->avpkt; |
708 |
|
709 |
if (!i) {
|
710 |
src = copy; |
711 |
|
712 |
if (codec->init)
|
713 |
err = codec->init(copy); |
714 |
|
715 |
update_context_from_thread(avctx, copy, 1);
|
716 |
} else {
|
717 |
copy->is_copy = 1;
|
718 |
copy->priv_data = av_malloc(codec->priv_data_size); |
719 |
memcpy(copy->priv_data, src->priv_data, codec->priv_data_size); |
720 |
|
721 |
if (codec->init_thread_copy)
|
722 |
err = codec->init_thread_copy(copy); |
723 |
} |
724 |
|
725 |
if (err) goto error; |
726 |
|
727 |
pthread_create(&p->thread, NULL, frame_worker_thread, p);
|
728 |
} |
729 |
|
730 |
return 0; |
731 |
|
732 |
error:
|
733 |
frame_thread_free(avctx, i+1);
|
734 |
|
735 |
return err;
|
736 |
} |
737 |
|
738 |
void ff_thread_flush(AVCodecContext *avctx)
|
739 |
{ |
740 |
FrameThreadContext *fctx = avctx->thread_opaque; |
741 |
|
742 |
if (!avctx->thread_opaque) return; |
743 |
|
744 |
park_frame_worker_threads(fctx, avctx->thread_count); |
745 |
|
746 |
if (fctx->prev_thread)
|
747 |
update_context_from_thread(fctx->threads->avctx, fctx->prev_thread->avctx, 0);
|
748 |
|
749 |
fctx->next_decoding = fctx->next_finished = 0;
|
750 |
fctx->delaying = 1;
|
751 |
fctx->prev_thread = NULL;
|
752 |
} |
753 |
|
754 |
static int *allocate_progress(PerThreadContext *p) |
755 |
{ |
756 |
int i;
|
757 |
|
758 |
for (i = 0; i < MAX_BUFFERS; i++) |
759 |
if (!p->progress_used[i]) break; |
760 |
|
761 |
if (i == MAX_BUFFERS) {
|
762 |
av_log(p->avctx, AV_LOG_ERROR, "allocate_progress() overflow\n");
|
763 |
return NULL; |
764 |
} |
765 |
|
766 |
p->progress_used[i] = 1;
|
767 |
|
768 |
return p->progress[i];
|
769 |
} |
770 |
|
771 |
int ff_thread_get_buffer(AVCodecContext *avctx, AVFrame *f)
|
772 |
{ |
773 |
PerThreadContext *p = avctx->thread_opaque; |
774 |
int *progress, err;
|
775 |
|
776 |
f->owner = avctx; |
777 |
|
778 |
if (!(avctx->active_thread_type&FF_THREAD_FRAME)) {
|
779 |
f->thread_opaque = NULL;
|
780 |
return avctx->get_buffer(avctx, f);
|
781 |
} |
782 |
|
783 |
if (p->state != STATE_SETTING_UP &&
|
784 |
(avctx->codec->update_thread_context || !avctx->thread_safe_callbacks)) { |
785 |
av_log(avctx, AV_LOG_ERROR, "get_buffer() cannot be called after ff_thread_finish_setup()\n");
|
786 |
return -1; |
787 |
} |
788 |
|
789 |
pthread_mutex_lock(&p->parent->buffer_mutex); |
790 |
f->thread_opaque = progress = allocate_progress(p); |
791 |
|
792 |
if (!progress) {
|
793 |
pthread_mutex_unlock(&p->parent->buffer_mutex); |
794 |
return -1; |
795 |
} |
796 |
|
797 |
progress[0] =
|
798 |
progress[1] = -1; |
799 |
|
800 |
if (avctx->thread_safe_callbacks ||
|
801 |
avctx->get_buffer == avcodec_default_get_buffer) { |
802 |
err = avctx->get_buffer(avctx, f); |
803 |
} else {
|
804 |
p->requested_frame = f; |
805 |
p->state = STATE_GET_BUFFER; |
806 |
pthread_mutex_lock(&p->progress_mutex); |
807 |
pthread_cond_signal(&p->progress_cond); |
808 |
|
809 |
while (p->state != STATE_SETTING_UP)
|
810 |
pthread_cond_wait(&p->progress_cond, &p->progress_mutex); |
811 |
|
812 |
err = p->result; |
813 |
|
814 |
pthread_mutex_unlock(&p->progress_mutex); |
815 |
|
816 |
if (!avctx->codec->update_thread_context)
|
817 |
ff_thread_finish_setup(avctx); |
818 |
} |
819 |
|
820 |
pthread_mutex_unlock(&p->parent->buffer_mutex); |
821 |
|
822 |
/*
|
823 |
* Buffer age is difficult to keep track of between
|
824 |
* multiple threads, and the optimizations it allows
|
825 |
* are not worth the effort. It is disabled for now.
|
826 |
*/
|
827 |
f->age = INT_MAX; |
828 |
|
829 |
return err;
|
830 |
} |
831 |
|
832 |
void ff_thread_release_buffer(AVCodecContext *avctx, AVFrame *f)
|
833 |
{ |
834 |
PerThreadContext *p = avctx->thread_opaque; |
835 |
|
836 |
if (!(avctx->active_thread_type&FF_THREAD_FRAME)) {
|
837 |
avctx->release_buffer(avctx, f); |
838 |
return;
|
839 |
} |
840 |
|
841 |
if (p->num_released_buffers >= MAX_BUFFERS) {
|
842 |
av_log(p->avctx, AV_LOG_ERROR, "too many thread_release_buffer calls!\n");
|
843 |
return;
|
844 |
} |
845 |
|
846 |
if(avctx->debug & FF_DEBUG_BUFFERS)
|
847 |
av_log(avctx, AV_LOG_DEBUG, "thread_release_buffer called on pic %p, %d buffers used\n",
|
848 |
f, f->owner->internal_buffer_count); |
849 |
|
850 |
p->released_buffers[p->num_released_buffers++] = *f; |
851 |
memset(f->data, 0, sizeof(f->data)); |
852 |
} |
853 |
|
854 |
/**
|
855 |
* Set the threading algorithms used.
|
856 |
*
|
857 |
* Threading requires more than one thread.
|
858 |
* Frame threading requires entire frames to be passed to the codec,
|
859 |
* and introduces extra decoding delay, so is incompatible with low_delay.
|
860 |
*
|
861 |
* @param avctx The context.
|
862 |
*/
|
863 |
static void validate_thread_parameters(AVCodecContext *avctx) |
864 |
{ |
865 |
int frame_threading_supported = (avctx->codec->capabilities & CODEC_CAP_FRAME_THREADS)
|
866 |
&& !(avctx->flags & CODEC_FLAG_TRUNCATED) |
867 |
&& !(avctx->flags & CODEC_FLAG_LOW_DELAY) |
868 |
&& !(avctx->flags2 & CODEC_FLAG2_CHUNKS); |
869 |
if (avctx->thread_count == 1) { |
870 |
avctx->active_thread_type = 0;
|
871 |
} else if (frame_threading_supported && (avctx->thread_type & FF_THREAD_FRAME)) { |
872 |
avctx->active_thread_type = FF_THREAD_FRAME; |
873 |
} else {
|
874 |
avctx->active_thread_type = FF_THREAD_SLICE; |
875 |
} |
876 |
} |
877 |
|
878 |
int ff_thread_init(AVCodecContext *avctx, int thread_count) |
879 |
{ |
880 |
if (avctx->thread_opaque) {
|
881 |
av_log(avctx, AV_LOG_ERROR, "avcodec_thread_init is ignored after avcodec_open\n");
|
882 |
return -1; |
883 |
} |
884 |
|
885 |
avctx->thread_count = FFMAX(1, thread_count);
|
886 |
|
887 |
if (avctx->codec) {
|
888 |
validate_thread_parameters(avctx); |
889 |
|
890 |
if (avctx->active_thread_type&FF_THREAD_SLICE)
|
891 |
return thread_init(avctx);
|
892 |
else if (avctx->active_thread_type&FF_THREAD_FRAME) |
893 |
return frame_thread_init(avctx);
|
894 |
} |
895 |
|
896 |
return 0; |
897 |
} |
898 |
|
899 |
void ff_thread_free(AVCodecContext *avctx)
|
900 |
{ |
901 |
if (avctx->active_thread_type&FF_THREAD_FRAME)
|
902 |
frame_thread_free(avctx, avctx->thread_count); |
903 |
else
|
904 |
thread_free(avctx); |
905 |
} |