1 /*
2 * This file is part of FFmpeg.
3 *
4 * FFmpeg is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
8 *
9 * FFmpeg is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with FFmpeg; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17 */
18
19 /**
20 * @file
21 * Slice multithreading support functions
22 * @see doc/multithreading.txt
23 */
24
25 #include "config.h"
26
27 #include "avcodec.h"
28 #include "internal.h"
29 #include "pthread_internal.h"
30 #include "thread.h"
31
32 #include "libavutil/avassert.h"
33 #include "libavutil/common.h"
34 #include "libavutil/cpu.h"
35 #include "libavutil/mem.h"
36 #include "libavutil/thread.h"
37 #include "libavutil/slicethread.h"
38
/** Per-job callback: invoked by worker_func() with the codec context and a
 *  pointer to that job's own argument (base args + job_size * jobnr). */
typedef int (action_func)(AVCodecContext *c, void *arg);
/** Per-job callback: invoked by worker_func() with the codec context, the
 *  shared argument pointer, the job number and the worker thread number. */
typedef int (action_func2)(AVCodecContext *c, void *arg, int jobnr, int threadnr);
/** Callback invoked by main_function() with the codec context. */
typedef int (main_func)(AVCodecContext *c);
42
/**
 * Per-codec-context state for slice threading, stored in
 * avctx->internal->thread_ctx.
 */
typedef struct SliceThreadContext {
    AVSliceThread *thread;           ///< handle filled in by avpriv_slicethread_create()
    action_func *func;               ///< job callback used when non-NULL (see worker_func())
    action_func2 *func2;             ///< job callback used when func is NULL
    main_func *mainfunc;             ///< callback run through main_function(), may be NULL
    void *args;                      ///< argument pointer for the current execute call
    int *rets;                       ///< optional per-job return values, indexed by job number
    int job_size;                    ///< byte stride between per-job arguments for func

    int *entries;                    ///< progress counters, allocated by ff_alloc_entries()
    int entries_count;               ///< number of elements in entries
    int thread_count;                ///< number of elements in progress_mutex / progress_cond
    pthread_cond_t *progress_cond;   ///< one condition variable per thread
    pthread_mutex_t *progress_mutex; ///< one mutex per thread, protects entries updates
} SliceThreadContext;
58
main_function(void * priv)59 static void main_function(void *priv) {
60 AVCodecContext *avctx = priv;
61 SliceThreadContext *c = avctx->internal->thread_ctx;
62 c->mainfunc(avctx);
63 }
64
worker_func(void * priv,int jobnr,int threadnr,int nb_jobs,int nb_threads)65 static void worker_func(void *priv, int jobnr, int threadnr, int nb_jobs, int nb_threads)
66 {
67 AVCodecContext *avctx = priv;
68 SliceThreadContext *c = avctx->internal->thread_ctx;
69 int ret;
70
71 ret = c->func ? c->func(avctx, (char *)c->args + c->job_size * jobnr)
72 : c->func2(avctx, c->args, jobnr, threadnr);
73 if (c->rets)
74 c->rets[jobnr] = ret;
75 }
76
/**
 * Tear down slice threading for a codec context.
 *
 * Frees the slice thread handle, destroys the per-thread progress mutexes
 * and condition variables, and releases the progress arrays and the
 * context itself. avctx->internal->thread_ctx is NULL afterwards.
 *
 * @param avctx codec context whose slice thread context is released;
 *              a NULL thread_ctx is tolerated and makes this a no-op
 */
void ff_slice_thread_free(AVCodecContext *avctx)
{
    SliceThreadContext *c = avctx->internal->thread_ctx;
    int i;

    if (!c)
        return;

    avpriv_slicethread_free(&c->thread);

    /* The synchronisation arrays are allocated lazily by ff_alloc_entries()
     * and may be NULL here whatever thread_count says, so never index them
     * unless both exist. */
    if (c->progress_mutex && c->progress_cond) {
        for (i = 0; i < c->thread_count; i++) {
            pthread_mutex_destroy(&c->progress_mutex[i]);
            pthread_cond_destroy(&c->progress_cond[i]);
        }
    }

    av_freep(&c->entries);
    av_freep(&c->progress_mutex);
    av_freep(&c->progress_cond);
    av_freep(&avctx->internal->thread_ctx);
}
94
/**
 * execute() implementation backed by the slice thread pool.
 *
 * Falls back to avcodec_default_execute() when slice threading is not
 * active or only one thread is configured. Otherwise the job description is
 * stored in the slice thread context and the jobs are dispatched through
 * avpriv_slicethread_execute(); the main function is requested whenever a
 * mainfunc is currently set.
 *
 * @param avctx     codec context
 * @param func      per-job callback, or NULL to make workers use func2
 * @param arg       base pointer of the per-job arguments
 * @param ret       optional array receiving each job's return value
 * @param job_count number of jobs; nothing is done if <= 0
 * @param job_size  byte stride between per-job arguments
 * @return the fallback's return value, otherwise always 0
 */
static int thread_execute(AVCodecContext *avctx, action_func* func, void *arg, int *ret, int job_count, int job_size)
{
    SliceThreadContext *slice_ctx = avctx->internal->thread_ctx;
    const int use_pool = (avctx->active_thread_type & FF_THREAD_SLICE) &&
                         avctx->thread_count > 1;

    if (!use_pool)
        return avcodec_default_execute(avctx, func, arg, ret, job_count, job_size);

    if (job_count <= 0)
        return 0;

    slice_ctx->func     = func;
    slice_ctx->args     = arg;
    slice_ctx->job_size = job_size;
    slice_ctx->rets     = ret;

    avpriv_slicethread_execute(slice_ctx->thread, job_count,
                               slice_ctx->mainfunc != NULL);
    return 0;
}
113
/**
 * execute2() implementation backed by the slice thread pool.
 *
 * Records func2 in the slice thread context and dispatches through
 * thread_execute() with a NULL func and a job size of 0, which makes
 * worker_func() call func2 for every job.
 *
 * @return the value returned by thread_execute()
 */
static int thread_execute2(AVCodecContext *avctx, action_func2* func2, void *arg, int *ret, int job_count)
{
    SliceThreadContext *slice_ctx = avctx->internal->thread_ctx;

    slice_ctx->func2 = func2;

    return thread_execute(avctx, NULL, arg, ret, job_count, 0);
}
120
/**
 * Run job_count jobs through func2 with a main function registered.
 *
 * Stores both func2 and mainfunc in the slice thread context before
 * dispatching through thread_execute(). The stored mainfunc is not cleared
 * afterwards.
 *
 * @return the value returned by thread_execute()
 */
int ff_slice_thread_execute_with_mainfunc(AVCodecContext *avctx, action_func2* func2, main_func *mainfunc, void *arg, int *ret, int job_count)
{
    SliceThreadContext *slice_ctx = avctx->internal->thread_ctx;

    slice_ctx->mainfunc = mainfunc;
    slice_ctx->func2    = func2;

    return thread_execute(avctx, NULL, arg, ret, job_count, 0);
}
128
/**
 * Set up slice threading for a codec context.
 *
 * Determines the thread count (forcing 1 for MPEG-1 video encoding above
 * 2800 lines, auto-detecting when the requested count is 0), then creates
 * the slice thread pool. When fewer than two threads result, or the
 * allocation or pool creation fails, threading is disabled by clearing
 * active_thread_type. On success the execute/execute2 callbacks of the
 * context are replaced by the pool-backed implementations.
 *
 * @param avctx codec context to initialise
 * @return always 0
 */
int ff_slice_thread_init(AVCodecContext *avctx)
{
    SliceThreadContext *slice_ctx;
    void (*main_cb)(void *) = NULL;
    int nb_threads = avctx->thread_count;

    // This cannot be done in the encoder init as the threads are created before it
    if (av_codec_is_encoder(avctx->codec) &&
        avctx->codec_id == AV_CODEC_ID_MPEG1VIDEO &&
        avctx->height > 2800) {
        avctx->thread_count = 1;
        nb_threads          = 1;
    }

    if (nb_threads == 0) {
        int cpus = av_cpu_count();

        // never use more CPUs than there are 16-line rows (rounded up)
        if (avctx->height)
            cpus = FFMIN(cpus, (avctx->height + 15) / 16);

        // use number of cores + 1 as thread count if there is more than one
        nb_threads = cpus > 1 ? FFMIN(cpus + 1, MAX_AUTO_THREADS) : 1;
        avctx->thread_count = nb_threads;
    }

    if (nb_threads <= 1) {
        avctx->active_thread_type = 0;
        return 0;
    }

    slice_ctx = av_mallocz(sizeof(*slice_ctx));
    avctx->internal->thread_ctx = slice_ctx;

    if (avctx->codec->caps_internal & FF_CODEC_CAP_SLICE_THREAD_HAS_MF)
        main_cb = &main_function;

    // the pool is only created once the context allocation has succeeded
    if (slice_ctx)
        nb_threads = avpriv_slicethread_create(&slice_ctx->thread, avctx,
                                               worker_func, main_cb, nb_threads);

    if (!slice_ctx || nb_threads <= 1) {
        if (slice_ctx)
            avpriv_slicethread_free(&slice_ctx->thread);
        av_freep(&avctx->internal->thread_ctx);
        avctx->thread_count       = 1;
        avctx->active_thread_type = 0;
        return 0;
    }

    avctx->thread_count = nb_threads;
    avctx->execute      = thread_execute;
    avctx->execute2     = thread_execute2;
    return 0;
}
173
/**
 * Add n to the progress counter entries[field] and signal the condition
 * variable of the given thread, all while holding that thread's progress
 * mutex.
 *
 * @param avctx  codec context
 * @param field  index of the progress counter to advance
 * @param thread index of the mutex/condition pair to use
 * @param n      amount added to the counter
 */
void ff_thread_report_progress2(AVCodecContext *avctx, int field, int thread, int n)
{
    SliceThreadContext *slice_ctx = avctx->internal->thread_ctx;
    int *progress = slice_ctx->entries;
    pthread_mutex_t *lock = &slice_ctx->progress_mutex[thread];
    pthread_cond_t *cond = &slice_ctx->progress_cond[thread];

    pthread_mutex_lock(lock);
    progress[field] += n;
    pthread_cond_signal(cond);
    pthread_mutex_unlock(lock);
}
184
/**
 * Block until entries[field - 1] is at least shift ahead of entries[field].
 *
 * Returns immediately when no progress counters are allocated or when
 * field is 0. The wait uses the mutex/condition pair of the previous thread
 * (thread - 1), wrapping to the last thread for thread 0.
 *
 * @param avctx  codec context
 * @param field  index of the caller's progress counter
 * @param thread index of the calling thread
 * @param shift  required lead of the previous counter over this one
 */
void ff_thread_await_progress2(AVCodecContext *avctx, int field, int thread, int shift)
{
    SliceThreadContext *slice_ctx = avctx->internal->thread_ctx;
    int *progress = slice_ctx->entries;
    pthread_mutex_t *lock;
    pthread_cond_t *cond;
    int prev;

    if (!progress || !field)
        return;

    if (thread)
        prev = thread - 1;
    else
        prev = slice_ctx->thread_count - 1;

    lock = &slice_ctx->progress_mutex[prev];
    cond = &slice_ctx->progress_cond[prev];

    pthread_mutex_lock(lock);
    while (progress[field - 1] - progress[field] < shift)
        pthread_cond_wait(cond, lock);
    pthread_mutex_unlock(lock);
}
200
/**
 * (Re)allocate the progress counters used by ff_thread_report_progress2()
 * and ff_thread_await_progress2().
 *
 * Does nothing unless slice threading is active. Any previous counter array
 * is replaced by a zeroed array of count elements. The per-thread mutexes
 * and condition variables are allocated and initialised on the first
 * successful call only; later calls reuse them, because initialising an
 * already initialised mutex or condition variable is undefined.
 *
 * On failure every array is released (destroying previously initialised
 * mutexes/conditions first) and the stored counts are reset to 0, so the
 * context never advertises elements that no longer exist.
 *
 * @param avctx codec context
 * @param count number of progress counters to allocate
 * @return 0 on success or when slice threading is inactive,
 *         AVERROR(ENOMEM) on allocation failure
 */
int ff_alloc_entries(AVCodecContext *avctx, int count)
{
    SliceThreadContext *p;
    int had_sync, sync_count, i;

    if (!(avctx->active_thread_type & FF_THREAD_SLICE))
        return 0;

    p = avctx->internal->thread_ctx;

    /* Remember whether the mutexes/conditions already exist (and how many)
     * before thread_count is overwritten below. */
    had_sync   = p->progress_mutex != NULL;
    sync_count = had_sync ? p->thread_count : 0;

    if (p->entries) {
        av_assert0(p->thread_count == avctx->thread_count);
        av_freep(&p->entries);
    }

    p->thread_count = avctx->thread_count;
    p->entries      = av_mallocz_array(count, sizeof(int));

    if (!had_sync) {
        p->progress_mutex = av_malloc_array(p->thread_count, sizeof(pthread_mutex_t));
        p->progress_cond  = av_malloc_array(p->thread_count, sizeof(pthread_cond_t));
    }

    if (!p->entries || !p->progress_mutex || !p->progress_cond) {
        /* Only objects initialised by an earlier call may be destroyed;
         * freshly allocated arrays have not been initialised yet. */
        if (had_sync && p->progress_mutex && p->progress_cond) {
            for (i = 0; i < sync_count; i++) {
                pthread_mutex_destroy(&p->progress_mutex[i]);
                pthread_cond_destroy(&p->progress_cond[i]);
            }
        }
        av_freep(&p->entries);
        av_freep(&p->progress_mutex);
        av_freep(&p->progress_cond);
        p->entries_count = 0;
        p->thread_count  = 0;
        return AVERROR(ENOMEM);
    }
    p->entries_count = count;

    if (!had_sync) {
        for (i = 0; i < p->thread_count; i++) {
            pthread_mutex_init(&p->progress_mutex[i], NULL);
            pthread_cond_init(&p->progress_cond[i], NULL);
        }
    }

    return 0;
}
237
/**
 * Reset all progress counters to zero.
 *
 * A no-op when no counter array is currently allocated (entries is NULL
 * until ff_alloc_entries() succeeds), since passing a NULL pointer to
 * memset() is undefined.
 *
 * @param avctx codec context whose slice thread context holds the counters
 */
void ff_reset_entries(AVCodecContext *avctx)
{
    SliceThreadContext *p = avctx->internal->thread_ctx;

    if (!p->entries)
        return;

    memset(p->entries, 0, p->entries_count * sizeof(*p->entries));
}
243