/*
- * Copyright (c) 2004 Michael Niedermayer <michaelni@gmx.at>
+ * Copyright (c) 2004 Roman Shaposhnik
*
- * This library is free software; you can redistribute it and/or
+ * Many thanks to Steven M. Schultz for providing clever ideas and
+ * to Michael Niedermayer <michaelni@gmx.at> for writing initial
+ * implementation.
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
- * version 2 of the License, or (at your option) any later version.
+ * version 2.1 of the License, or (at your option) any later version.
*
- * This library is distributed in the hope that it will be useful,
+ * FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- *
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
-#include <semaphore.h>
#include <pthread.h>
-//#define DEBUG
-
#include "avcodec.h"
-#include "common.h"
-
-
-typedef struct ThreadContext{
- AVCodecContext *avctx;
- pthread_t thread;
- sem_t work_sem;
- sem_t done_sem;
- int (*func)(AVCodecContext *c, void *arg);
- void *arg;
- int ret;
-}ThreadContext;
-
-static void * thread_func(void *v){
- ThreadContext *c= v;
-
- for(;;){
-//printf("thread_func %X enter wait\n", (int)v); fflush(stdout);
- sem_wait(&c->work_sem);
-//printf("thread_func %X after wait (func=%X)\n", (int)v, (int)c->func); fflush(stdout);
- if(c->func)
- c->ret= c->func(c->avctx, c->arg);
- else
- return NULL;
-//printf("thread_func %X signal complete\n", (int)v); fflush(stdout);
- sem_post(&c->done_sem);
+/* Job callback: called with the codec context and a pointer to one job's argument; its int result is stored in ThreadContext.rets. */
+typedef int (action_func)(AVCodecContext *c, void *arg);
+/*
+ * State of the worker pool, stored in AVCodecContext.thread_opaque.
+ * One instance is shared by the calling thread and all workers.
+ */
+typedef struct ThreadContext {
+ pthread_t *workers; /* thread handles, allocated in avcodec_thread_init() with thread_count entries */
+ action_func *func; /* callback run for every job of the current avcodec_thread_execute() call */
+ void *args; /* base address of the job arguments; job i is passed (char*)args + i*job_size */
+ int *rets; /* receives the callback results, written at index job % rets_count */
+ int rets_count; /* number of usable entries in rets (1 when the caller passed no result array) */
+ int job_count; /* number of jobs of the current avcodec_thread_execute() call */
+ int job_size; /* distance in bytes between two consecutive job arguments in args */
+/* Synchronisation state; current_job and done are accessed with current_job_lock held once workers exist. */
+ pthread_cond_t last_job_cond; /* signalled by a worker when current_job == thread_count + job_count */
+ pthread_cond_t current_job_cond; /* broadcast to wake the workers, for new jobs or for shutdown */
+ pthread_mutex_t current_job_lock; /* mutex paired with both condition variables */
+ int current_job; /* next job index to hand out; at startup it also numbers the workers */
+ int done; /* set to 1 by avcodec_thread_free() to make the workers return */
+} ThreadContext;
+
+/**
+ * Entry point of every worker thread.
+ *
+ * A worker first takes a private id from the shared current_job counter.
+ * It then alternates between sleeping on current_job_cond and running jobs:
+ * the first job after a wakeup is the one whose index equals the worker's
+ * id, every following job index is fetched from current_job. Whenever the
+ * worker runs out of jobs and current_job has reached
+ * thread_count + job_count, it signals last_job_cond.
+ *
+ * NOTE(review): a return of pthread_cond_wait() that was not caused by
+ * avcodec_thread_execute() (POSIX permits spurious wakeups) is treated like
+ * a real one; telling them apart needs state ThreadContext does not carry.
+ *
+ * @param v the AVCodecContext whose thread_opaque points to the ThreadContext
+ * @return NULL, after ThreadContext.done has been observed
+ */
+static void* attribute_align_arg worker(void *v)
+{
+    AVCodecContext *avctx = v;
+    ThreadContext *c = avctx->thread_opaque;
+    int our_job = c->job_count; /* >= job_count, so the wait loop is entered first */
+    int thread_count = avctx->thread_count;
+    int self_id;
+
+    pthread_mutex_lock(&c->current_job_lock);
+    self_id = c->current_job++;
+    for (;;){
+        while (our_job >= c->job_count) {
+            if (c->current_job == thread_count + c->job_count)
+                pthread_cond_signal(&c->last_job_cond);
+
+            /* Shutdown may have been requested and broadcast before this
+             * thread got here. Sleeping unconditionally would miss that
+             * wakeup for good and leave pthread_join() in
+             * avcodec_thread_free() blocked forever. */
+            if (!c->done)
+                pthread_cond_wait(&c->current_job_cond, &c->current_job_lock);
+            our_job = self_id;
+
+            if (c->done) {
+                pthread_mutex_unlock(&c->current_job_lock);
+                return NULL;
+            }
+        }
+        pthread_mutex_unlock(&c->current_job_lock);
+
+        /* The callback runs without the lock so that jobs execute in parallel. */
+        c->rets[our_job%c->rets_count] = c->func(avctx, (char*)c->args + our_job*c->job_size);
+
+        pthread_mutex_lock(&c->current_job_lock);
+        our_job = c->current_job++;
}
-
- return NULL;
}
-/**
- * free what has been allocated by avcodec_thread_init().
- * must be called after decoding has finished, especially dont call while avcodec_thread_execute() is running
- */
-void avcodec_thread_free(AVCodecContext *s){
- ThreadContext *c= s->thread_opaque;
+/**
+ * Block the calling thread until the workers have run out of jobs, then
+ * release current_job_lock.
+ *
+ * The caller must hold c->current_job_lock. The wait is guarded by the same
+ * condition the workers test before signalling last_job_cond, so a wakeup
+ * that arrives without that condition being true (POSIX allows spurious
+ * wakeups) does not let the caller continue early.
+ *
+ * @param c            the shared pool state
+ * @param thread_count number of worker threads taking part
+ */
+static av_always_inline void avcodec_thread_park_workers(ThreadContext *c, int thread_count)
+{
+    while (c->current_job != thread_count + c->job_count)
+        pthread_cond_wait(&c->last_job_cond, &c->current_job_lock);
+    pthread_mutex_unlock(&c->current_job_lock);
+}
+
+/**
+ * Stop the worker threads and free what avcodec_thread_init() allocated.
+ *
+ * Sets the done flag, wakes all workers, joins avctx->thread_count threads,
+ * destroys the mutex and both condition variables and resets
+ * avctx->thread_opaque to NULL. Does nothing when thread_opaque is NULL.
+ *
+ * Must be called after decoding has finished; in particular it must not be
+ * called while avcodec_thread_execute() is running on the same context.
+ *
+ * @param avctx codec context whose thread pool is torn down
+ */
+void avcodec_thread_free(AVCodecContext *avctx)
+{
+    ThreadContext *c = avctx->thread_opaque;
int i;
- for(i=0; i<s->thread_count; i++){
- int val;
-
- sem_getvalue(&c[i].work_sem, &val); assert(val == 0);
- sem_getvalue(&c[i].done_sem, &val); assert(val == 0);
-
- c[i].func= NULL;
- sem_post(&c[i].work_sem);
- pthread_join(c[i].thread, NULL);
- sem_destroy(&c[i].work_sem);
- sem_destroy(&c[i].done_sem);
- }
+
+    /* Nothing to release if the pool was never set up. */
+    if (!c)
+        return;
+
+    pthread_mutex_lock(&c->current_job_lock);
+    c->done = 1;
+    pthread_cond_broadcast(&c->current_job_cond);
+    pthread_mutex_unlock(&c->current_job_lock);
- av_freep(&s->thread_opaque);
+    for (i=0; i<avctx->thread_count; i++)
+        pthread_join(c->workers[i], NULL);
+
+    /* All workers have returned, so nobody uses the primitives any more. */
+    pthread_mutex_destroy(&c->current_job_lock);
+    pthread_cond_destroy(&c->current_job_cond);
+    pthread_cond_destroy(&c->last_job_cond);
+    av_free(c->workers);
+    av_freep(&avctx->thread_opaque);
}
-int avcodec_thread_execute(AVCodecContext *s, int (*func)(AVCodecContext *c2, void *arg2),void **arg, int *ret, int count){
- ThreadContext *c= s->thread_opaque;
- int i, val;
-
- assert(s == c->avctx);
- assert(count <= s->thread_count);
-
- /* note, we can be certain that this is not called with the same AVCodecContext by different threads at the same time */
-
- for(i=0; i<count; i++){
- sem_getvalue(&c[i].work_sem, &val); assert(val == 0);
- sem_getvalue(&c[i].done_sem, &val); assert(val == 0);
-
- c[i].arg= arg[i];
- c[i].func= func;
- c[i].ret= 12345;
- sem_post(&c[i].work_sem);
- }
- for(i=0; i<count; i++){
- sem_wait(&c[i].done_sem);
-
- sem_getvalue(&c[i].work_sem, &val); assert(val == 0);
- sem_getvalue(&c[i].done_sem, &val); assert(val == 0);
-
- c[i].func= NULL;
- if(ret) ret[i]= c[i].ret;
+/**
+ * Run func once per job on the worker threads and wait for them.
+ *
+ * Job i is called as func(avctx, (char*)arg + i*job_size). When ret is
+ * non-NULL the result of job i is stored in ret[i]; otherwise the results
+ * are written to a local scratch variable and dropped.
+ *
+ * @param avctx     codec context owning the thread pool
+ * @param func      callback to run for every job
+ * @param arg       base address of the job arguments
+ * @param ret       array of job_count results, or NULL
+ * @param job_count number of jobs; nothing is done when it is <= 0
+ * @param job_size  distance in bytes between two job arguments
+ * @return always 0
+ */
+int avcodec_thread_execute(AVCodecContext *avctx, action_func* func, void *arg, int *ret, int job_count, int job_size)
+{
+    ThreadContext *pool = avctx->thread_opaque;
+    const int nb_workers = avctx->thread_count;
+    int discarded;
+
+    if (job_count <= 0)
+        return 0;
+
+    pthread_mutex_lock(&pool->current_job_lock);
+
+    /* Describe the batch; the workers read this after being woken. */
+    pool->func = func;
+    pool->args = arg;
+    pool->job_size = job_size;
+    pool->job_count = job_count;
+    /* Indices below the worker count are claimed through the worker ids. */
+    pool->current_job = nb_workers;
+    if (!ret) {
+        pool->rets = &discarded;
+        pool->rets_count = 1;
+    } else {
+        pool->rets = ret;
+        pool->rets_count = job_count;
}
+    pthread_cond_broadcast(&pool->current_job_cond);
+
+    /* Waits on last_job_cond and releases current_job_lock. */
+    avcodec_thread_park_workers(pool, nb_workers);
+
return 0;
}
-int avcodec_thread_init(AVCodecContext *s, int thread_count){
+/**
+ * Create a pool of thread_count worker threads for avctx.
+ *
+ * Allocates the ThreadContext and the thread handle array, initialises the
+ * mutex and both condition variables, starts the workers and waits until
+ * they are parked. On success avctx->thread_opaque, avctx->thread_count and
+ * avctx->execute are set.
+ *
+ * @param avctx        codec context that will own the pool
+ * @param thread_count number of worker threads to start, must be > 0
+ * @return 0 on success, -1 on invalid thread_count, allocation failure,
+ *         failure to initialise a synchronisation primitive or failure to
+ *         create a thread
+ */
+int avcodec_thread_init(AVCodecContext *avctx, int thread_count)
+{
int i;
ThreadContext *c;
- s->thread_count= thread_count;
-
- assert(!s->thread_opaque);
- c= av_mallocz(sizeof(ThreadContext)*thread_count);
- s->thread_opaque= c;
-
- for(i=0; i<thread_count; i++){
-//printf("init semaphors %d\n", i); fflush(stdout);
- c[i].avctx= s;
- if(sem_init(&c[i].work_sem, 0, 0))
- goto fail;
- if(sem_init(&c[i].done_sem, 0, 0))
- goto fail;
-//printf("create thread %d\n", i); fflush(stdout);
- if(pthread_create(&c[i].thread, NULL, thread_func, &c[i]))
- goto fail;
+
+    /* Without workers nothing could ever signal last_job_cond. */
+    if (thread_count <= 0)
+        return -1;
+
+    c = av_mallocz(sizeof(ThreadContext));
+    if (!c)
+        return -1;
+
+    c->workers = av_mallocz(sizeof(pthread_t)*thread_count);
+    if (!c->workers)
+        goto fail_alloc;
+
+    /* Each primitive is checked so that a failure unwinds exactly what
+     * has been initialised so far. */
+    if (pthread_mutex_init(&c->current_job_lock, NULL))
+        goto fail_alloc;
+    if (pthread_cond_init(&c->current_job_cond, NULL))
+        goto fail_mutex;
+    if (pthread_cond_init(&c->last_job_cond, NULL))
+        goto fail_cond;
+
+    avctx->thread_opaque = c;
+    avctx->thread_count = thread_count;
+    c->current_job = 0;
+    c->job_count = 0;
+    c->job_size = 0;
+    c->done = 0;
+    /* Hold the lock while starting threads: the workers block on it until
+     * this thread starts waiting in avcodec_thread_park_workers(). */
+    pthread_mutex_lock(&c->current_job_lock);
+    for (i=0; i<thread_count; i++) {
+        if(pthread_create(&c->workers[i], NULL, worker, avctx)) {
+            /* Only the i threads that exist must be joined. */
+            avctx->thread_count = i;
+            pthread_mutex_unlock(&c->current_job_lock);
+            avcodec_thread_free(avctx);
+            return -1;
+        }
}
-//printf("init done\n"); fflush(stdout);
-
- s->execute= avcodec_thread_execute;
+    avcodec_thread_park_workers(c, thread_count);
+
+    avctx->execute = avcodec_thread_execute;
return 0;
-fail:
- avcodec_thread_free(s);
- return -1;
+
+fail_cond:
+    pthread_cond_destroy(&c->current_job_cond);
+fail_mutex:
+    pthread_mutex_destroy(&c->current_job_lock);
+fail_alloc:
+    av_free(c->workers);
+    av_free(c);
+    return -1;
}