When calling ff_alloc_entries, a number of entries are created. They are never freed, as running fate with slice threading and several frames on e.g. fate-hevc-conformance-ENTP_A_Qualcomm_1 would show. Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
		
			
				
	
	
		
			308 lines
		
	
	
		
			8.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			308 lines
		
	
	
		
			8.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * This file is part of FFmpeg.
 | |
|  *
 | |
|  * FFmpeg is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2.1 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * FFmpeg is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with FFmpeg; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | |
|  */
 | |
| 
 | |
| /**
 | |
|  * @file
 | |
|  * Slice multithreading support functions
 | |
|  * @see doc/multithreading.txt
 | |
|  */
 | |
| 
 | |
| #include "config.h"
 | |
| 
 | |
| #if HAVE_PTHREADS
 | |
| #include <pthread.h>
 | |
| #elif HAVE_W32THREADS
 | |
| #include "compat/w32pthreads.h"
 | |
| #elif HAVE_OS2THREADS
 | |
| #include "compat/os2threads.h"
 | |
| #endif
 | |
| 
 | |
| #include "avcodec.h"
 | |
| #include "internal.h"
 | |
| #include "pthread_internal.h"
 | |
| #include "thread.h"
 | |
| 
 | |
| #include "libavutil/common.h"
 | |
| #include "libavutil/cpu.h"
 | |
| #include "libavutil/mem.h"
 | |
| 
 | |
| typedef int (action_func)(AVCodecContext *c, void *arg);
 | |
| typedef int (action_func2)(AVCodecContext *c, void *arg, int jobnr, int threadnr);
 | |
| 
 | |
| typedef struct SliceThreadContext {
 | |
|     pthread_t *workers;
 | |
|     action_func *func;
 | |
|     action_func2 *func2;
 | |
|     void *args;
 | |
|     int *rets;
 | |
|     int rets_count;
 | |
|     int job_count;
 | |
|     int job_size;
 | |
| 
 | |
|     pthread_cond_t last_job_cond;
 | |
|     pthread_cond_t current_job_cond;
 | |
|     pthread_mutex_t current_job_lock;
 | |
|     unsigned current_execute;
 | |
|     int current_job;
 | |
|     int done;
 | |
| 
 | |
|     int *entries;
 | |
|     int entries_count;
 | |
|     int thread_count;
 | |
|     pthread_cond_t *progress_cond;
 | |
|     pthread_mutex_t *progress_mutex;
 | |
| } SliceThreadContext;
 | |
| 
 | |
| static void* attribute_align_arg worker(void *v)
 | |
| {
 | |
|     AVCodecContext *avctx = v;
 | |
|     SliceThreadContext *c = avctx->internal->thread_ctx;
 | |
|     unsigned last_execute = 0;
 | |
|     int our_job = c->job_count;
 | |
|     int thread_count = avctx->thread_count;
 | |
|     int self_id;
 | |
| 
 | |
|     pthread_mutex_lock(&c->current_job_lock);
 | |
|     self_id = c->current_job++;
 | |
|     for (;;){
 | |
|         while (our_job >= c->job_count) {
 | |
|             if (c->current_job == thread_count + c->job_count)
 | |
|                 pthread_cond_signal(&c->last_job_cond);
 | |
| 
 | |
|             while (last_execute == c->current_execute && !c->done)
 | |
|                 pthread_cond_wait(&c->current_job_cond, &c->current_job_lock);
 | |
|             last_execute = c->current_execute;
 | |
|             our_job = self_id;
 | |
| 
 | |
|             if (c->done) {
 | |
|                 pthread_mutex_unlock(&c->current_job_lock);
 | |
|                 return NULL;
 | |
|             }
 | |
|         }
 | |
|         pthread_mutex_unlock(&c->current_job_lock);
 | |
| 
 | |
|         c->rets[our_job%c->rets_count] = c->func ? c->func(avctx, (char*)c->args + our_job*c->job_size):
 | |
|                                                    c->func2(avctx, c->args, our_job, self_id);
 | |
| 
 | |
|         pthread_mutex_lock(&c->current_job_lock);
 | |
|         our_job = c->current_job++;
 | |
|     }
 | |
| }
 | |
| 
 | |
| void ff_slice_thread_free(AVCodecContext *avctx)
 | |
| {
 | |
|     SliceThreadContext *c = avctx->internal->thread_ctx;
 | |
|     int i;
 | |
| 
 | |
|     pthread_mutex_lock(&c->current_job_lock);
 | |
|     c->done = 1;
 | |
|     pthread_cond_broadcast(&c->current_job_cond);
 | |
|     for (i = 0; i < c->thread_count; i++)
 | |
|         pthread_cond_broadcast(&c->progress_cond[i]);
 | |
|     pthread_mutex_unlock(&c->current_job_lock);
 | |
| 
 | |
|     for (i=0; i<avctx->thread_count; i++)
 | |
|          pthread_join(c->workers[i], NULL);
 | |
| 
 | |
|     for (i = 0; i < c->thread_count; i++) {
 | |
|         pthread_mutex_destroy(&c->progress_mutex[i]);
 | |
|         pthread_cond_destroy(&c->progress_cond[i]);
 | |
|     }
 | |
| 
 | |
|     pthread_mutex_destroy(&c->current_job_lock);
 | |
|     pthread_cond_destroy(&c->current_job_cond);
 | |
|     pthread_cond_destroy(&c->last_job_cond);
 | |
| 
 | |
|     av_freep(&c->entries);
 | |
|     av_freep(&c->progress_mutex);
 | |
|     av_freep(&c->progress_cond);
 | |
| 
 | |
|     av_freep(&c->workers);
 | |
|     av_freep(&avctx->internal->thread_ctx);
 | |
| }
 | |
| 
 | |
| static av_always_inline void thread_park_workers(SliceThreadContext *c, int thread_count)
 | |
| {
 | |
|     while (c->current_job != thread_count + c->job_count)
 | |
|         pthread_cond_wait(&c->last_job_cond, &c->current_job_lock);
 | |
|     pthread_mutex_unlock(&c->current_job_lock);
 | |
| }
 | |
| 
 | |
| static int thread_execute(AVCodecContext *avctx, action_func* func, void *arg, int *ret, int job_count, int job_size)
 | |
| {
 | |
|     SliceThreadContext *c = avctx->internal->thread_ctx;
 | |
|     int dummy_ret;
 | |
| 
 | |
|     if (!(avctx->active_thread_type&FF_THREAD_SLICE) || avctx->thread_count <= 1)
 | |
|         return avcodec_default_execute(avctx, func, arg, ret, job_count, job_size);
 | |
| 
 | |
|     if (job_count <= 0)
 | |
|         return 0;
 | |
| 
 | |
|     pthread_mutex_lock(&c->current_job_lock);
 | |
| 
 | |
|     c->current_job = avctx->thread_count;
 | |
|     c->job_count = job_count;
 | |
|     c->job_size = job_size;
 | |
|     c->args = arg;
 | |
|     c->func = func;
 | |
|     if (ret) {
 | |
|         c->rets = ret;
 | |
|         c->rets_count = job_count;
 | |
|     } else {
 | |
|         c->rets = &dummy_ret;
 | |
|         c->rets_count = 1;
 | |
|     }
 | |
|     c->current_execute++;
 | |
|     pthread_cond_broadcast(&c->current_job_cond);
 | |
| 
 | |
|     thread_park_workers(c, avctx->thread_count);
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static int thread_execute2(AVCodecContext *avctx, action_func2* func2, void *arg, int *ret, int job_count)
 | |
| {
 | |
|     SliceThreadContext *c = avctx->internal->thread_ctx;
 | |
|     c->func2 = func2;
 | |
|     return thread_execute(avctx, NULL, arg, ret, job_count, 0);
 | |
| }
 | |
| 
 | |
| int ff_slice_thread_init(AVCodecContext *avctx)
 | |
| {
 | |
|     int i;
 | |
|     SliceThreadContext *c;
 | |
|     int thread_count = avctx->thread_count;
 | |
| 
 | |
| #if HAVE_W32THREADS
 | |
|     w32thread_init();
 | |
| #endif
 | |
| 
 | |
|     if (!thread_count) {
 | |
|         int nb_cpus = av_cpu_count();
 | |
|         if  (avctx->height)
 | |
|             nb_cpus = FFMIN(nb_cpus, (avctx->height+15)/16);
 | |
|         // use number of cores + 1 as thread count if there is more than one
 | |
|         if (nb_cpus > 1)
 | |
|             thread_count = avctx->thread_count = FFMIN(nb_cpus + 1, MAX_AUTO_THREADS);
 | |
|         else
 | |
|             thread_count = avctx->thread_count = 1;
 | |
|     }
 | |
| 
 | |
|     if (thread_count <= 1) {
 | |
|         avctx->active_thread_type = 0;
 | |
|         return 0;
 | |
|     }
 | |
| 
 | |
|     c = av_mallocz(sizeof(SliceThreadContext));
 | |
|     if (!c)
 | |
|         return -1;
 | |
| 
 | |
|     c->workers = av_mallocz_array(thread_count, sizeof(pthread_t));
 | |
|     if (!c->workers) {
 | |
|         av_free(c);
 | |
|         return -1;
 | |
|     }
 | |
| 
 | |
|     avctx->internal->thread_ctx = c;
 | |
|     c->current_job = 0;
 | |
|     c->job_count = 0;
 | |
|     c->job_size = 0;
 | |
|     c->done = 0;
 | |
|     pthread_cond_init(&c->current_job_cond, NULL);
 | |
|     pthread_cond_init(&c->last_job_cond, NULL);
 | |
|     pthread_mutex_init(&c->current_job_lock, NULL);
 | |
|     pthread_mutex_lock(&c->current_job_lock);
 | |
|     for (i=0; i<thread_count; i++) {
 | |
|         if(pthread_create(&c->workers[i], NULL, worker, avctx)) {
 | |
|            avctx->thread_count = i;
 | |
|            pthread_mutex_unlock(&c->current_job_lock);
 | |
|            ff_thread_free(avctx);
 | |
|            return -1;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     thread_park_workers(c, thread_count);
 | |
| 
 | |
|     avctx->execute = thread_execute;
 | |
|     avctx->execute2 = thread_execute2;
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| void ff_thread_report_progress2(AVCodecContext *avctx, int field, int thread, int n)
 | |
| {
 | |
|     SliceThreadContext *p = avctx->internal->thread_ctx;
 | |
|     int *entries = p->entries;
 | |
| 
 | |
|     pthread_mutex_lock(&p->progress_mutex[thread]);
 | |
|     entries[field] +=n;
 | |
|     pthread_cond_signal(&p->progress_cond[thread]);
 | |
|     pthread_mutex_unlock(&p->progress_mutex[thread]);
 | |
| }
 | |
| 
 | |
| void ff_thread_await_progress2(AVCodecContext *avctx, int field, int thread, int shift)
 | |
| {
 | |
|     SliceThreadContext *p  = avctx->internal->thread_ctx;
 | |
|     int *entries      = p->entries;
 | |
| 
 | |
|     if (!entries || !field) return;
 | |
| 
 | |
|     thread = thread ? thread - 1 : p->thread_count - 1;
 | |
| 
 | |
|     pthread_mutex_lock(&p->progress_mutex[thread]);
 | |
|     while ((entries[field - 1] - entries[field]) < shift){
 | |
|         pthread_cond_wait(&p->progress_cond[thread], &p->progress_mutex[thread]);
 | |
|     }
 | |
|     pthread_mutex_unlock(&p->progress_mutex[thread]);
 | |
| }
 | |
| 
 | |
| int ff_alloc_entries(AVCodecContext *avctx, int count)
 | |
| {
 | |
|     int i;
 | |
| 
 | |
|     if (avctx->active_thread_type & FF_THREAD_SLICE)  {
 | |
|         SliceThreadContext *p = avctx->internal->thread_ctx;
 | |
|         p->thread_count  = avctx->thread_count;
 | |
|         p->entries       = av_mallocz_array(count, sizeof(int));
 | |
| 
 | |
|         p->progress_mutex = av_malloc_array(p->thread_count, sizeof(pthread_mutex_t));
 | |
|         p->progress_cond  = av_malloc_array(p->thread_count, sizeof(pthread_cond_t));
 | |
| 
 | |
|         if (!p->entries || !p->progress_mutex || !p->progress_cond) {
 | |
|             av_freep(&p->entries);
 | |
|             av_freep(&p->progress_mutex);
 | |
|             av_freep(&p->progress_cond);
 | |
|             return AVERROR(ENOMEM);
 | |
|         }
 | |
|         p->entries_count  = count;
 | |
| 
 | |
|         for (i = 0; i < p->thread_count; i++) {
 | |
|             pthread_mutex_init(&p->progress_mutex[i], NULL);
 | |
|             pthread_cond_init(&p->progress_cond[i], NULL);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| void ff_reset_entries(AVCodecContext *avctx)
 | |
| {
 | |
|     SliceThreadContext *p = avctx->internal->thread_ctx;
 | |
|     memset(p->entries, 0, p->entries_count * sizeof(int));
 | |
| }
 |