summaryrefslogtreecommitdiff
path: root/libavcodec/pthread_slice.c (plain)
blob: 60f5b7889190a4da08157ca311fad8c0b226c621
/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
18
/**
 * @file
 * Slice multithreading support functions
 * @see doc/multithreading.txt
 */
24
25#include "config.h"
26
27#include "avcodec.h"
28#include "internal.h"
29#include "pthread_internal.h"
30#include "thread.h"
31
32#include "libavutil/avassert.h"
33#include "libavutil/common.h"
34#include "libavutil/cpu.h"
35#include "libavutil/mem.h"
36#include "libavutil/thread.h"
37
38typedef int (action_func)(AVCodecContext *c, void *arg);
39typedef int (action_func2)(AVCodecContext *c, void *arg, int jobnr, int threadnr);
40
41typedef struct SliceThreadContext {
42 pthread_t *workers;
43 action_func *func;
44 action_func2 *func2;
45 void *args;
46 int *rets;
47 int job_count;
48 int job_size;
49
50 pthread_cond_t last_job_cond;
51 pthread_cond_t current_job_cond;
52 pthread_mutex_t current_job_lock;
53 unsigned current_execute;
54 int current_job;
55 int done;
56
57 int *entries;
58 int entries_count;
59 int thread_count;
60 pthread_cond_t *progress_cond;
61 pthread_mutex_t *progress_mutex;
62} SliceThreadContext;
63
64static void* attribute_align_arg worker(void *v)
65{
66 AVCodecContext *avctx = v;
67 SliceThreadContext *c = avctx->internal->thread_ctx;
68 unsigned last_execute = 0;
69 int our_job = c->job_count;
70 int thread_count = avctx->thread_count;
71 int self_id;
72
73 pthread_mutex_lock(&c->current_job_lock);
74 self_id = c->current_job++;
75 for (;;){
76 int ret;
77 while (our_job >= c->job_count) {
78 if (c->current_job == thread_count + c->job_count)
79 pthread_cond_signal(&c->last_job_cond);
80
81 while (last_execute == c->current_execute && !c->done)
82 pthread_cond_wait(&c->current_job_cond, &c->current_job_lock);
83 last_execute = c->current_execute;
84 our_job = self_id;
85
86 if (c->done) {
87 pthread_mutex_unlock(&c->current_job_lock);
88 return NULL;
89 }
90 }
91 pthread_mutex_unlock(&c->current_job_lock);
92
93 ret = c->func ? c->func(avctx, (char*)c->args + our_job*c->job_size):
94 c->func2(avctx, c->args, our_job, self_id);
95 if (c->rets)
96 c->rets[our_job%c->job_count] = ret;
97
98 pthread_mutex_lock(&c->current_job_lock);
99 our_job = c->current_job++;
100 }
101}
102
103void ff_slice_thread_free(AVCodecContext *avctx)
104{
105 SliceThreadContext *c = avctx->internal->thread_ctx;
106 int i;
107
108 pthread_mutex_lock(&c->current_job_lock);
109 c->done = 1;
110 pthread_cond_broadcast(&c->current_job_cond);
111 for (i = 0; i < c->thread_count; i++)
112 pthread_cond_broadcast(&c->progress_cond[i]);
113 pthread_mutex_unlock(&c->current_job_lock);
114
115 for (i=0; i<avctx->thread_count; i++)
116 pthread_join(c->workers[i], NULL);
117
118 for (i = 0; i < c->thread_count; i++) {
119 pthread_mutex_destroy(&c->progress_mutex[i]);
120 pthread_cond_destroy(&c->progress_cond[i]);
121 }
122
123 pthread_mutex_destroy(&c->current_job_lock);
124 pthread_cond_destroy(&c->current_job_cond);
125 pthread_cond_destroy(&c->last_job_cond);
126
127 av_freep(&c->entries);
128 av_freep(&c->progress_mutex);
129 av_freep(&c->progress_cond);
130
131 av_freep(&c->workers);
132 av_freep(&avctx->internal->thread_ctx);
133}
134
135static av_always_inline void thread_park_workers(SliceThreadContext *c, int thread_count)
136{
137 while (c->current_job != thread_count + c->job_count)
138 pthread_cond_wait(&c->last_job_cond, &c->current_job_lock);
139 pthread_mutex_unlock(&c->current_job_lock);
140}
141
142static int thread_execute(AVCodecContext *avctx, action_func* func, void *arg, int *ret, int job_count, int job_size)
143{
144 SliceThreadContext *c = avctx->internal->thread_ctx;
145
146 if (!(avctx->active_thread_type&FF_THREAD_SLICE) || avctx->thread_count <= 1)
147 return avcodec_default_execute(avctx, func, arg, ret, job_count, job_size);
148
149 if (job_count <= 0)
150 return 0;
151
152 pthread_mutex_lock(&c->current_job_lock);
153
154 c->current_job = avctx->thread_count;
155 c->job_count = job_count;
156 c->job_size = job_size;
157 c->args = arg;
158 c->func = func;
159 c->rets = ret;
160 c->current_execute++;
161 pthread_cond_broadcast(&c->current_job_cond);
162
163 thread_park_workers(c, avctx->thread_count);
164
165 return 0;
166}
167
168static int thread_execute2(AVCodecContext *avctx, action_func2* func2, void *arg, int *ret, int job_count)
169{
170 SliceThreadContext *c = avctx->internal->thread_ctx;
171 c->func2 = func2;
172 return thread_execute(avctx, NULL, arg, ret, job_count, 0);
173}
174
175int ff_slice_thread_init(AVCodecContext *avctx)
176{
177 int i;
178 SliceThreadContext *c;
179 int thread_count = avctx->thread_count;
180
181#if HAVE_W32THREADS
182 w32thread_init();
183#endif
184
185 // We cannot do this in the encoder init as the threads are created before
186 if (av_codec_is_encoder(avctx->codec) &&
187 avctx->codec_id == AV_CODEC_ID_MPEG1VIDEO &&
188 avctx->height > 2800)
189 thread_count = avctx->thread_count = 1;
190
191 if (!thread_count) {
192 int nb_cpus = av_cpu_count();
193 if (avctx->height)
194 nb_cpus = FFMIN(nb_cpus, (avctx->height+15)/16);
195 // use number of cores + 1 as thread count if there is more than one
196 if (nb_cpus > 1)
197 thread_count = avctx->thread_count = FFMIN(nb_cpus + 1, MAX_AUTO_THREADS);
198 else
199 thread_count = avctx->thread_count = 1;
200 }
201
202 if (thread_count <= 1) {
203 avctx->active_thread_type = 0;
204 return 0;
205 }
206
207 c = av_mallocz(sizeof(SliceThreadContext));
208 if (!c)
209 return -1;
210
211 c->workers = av_mallocz_array(thread_count, sizeof(pthread_t));
212 if (!c->workers) {
213 av_free(c);
214 return -1;
215 }
216
217 avctx->internal->thread_ctx = c;
218 c->current_job = 0;
219 c->job_count = 0;
220 c->job_size = 0;
221 c->done = 0;
222 pthread_cond_init(&c->current_job_cond, NULL);
223 pthread_cond_init(&c->last_job_cond, NULL);
224 pthread_mutex_init(&c->current_job_lock, NULL);
225 pthread_mutex_lock(&c->current_job_lock);
226 for (i=0; i<thread_count; i++) {
227 if(pthread_create(&c->workers[i], NULL, worker, avctx)) {
228 avctx->thread_count = i;
229 pthread_mutex_unlock(&c->current_job_lock);
230 ff_thread_free(avctx);
231 return -1;
232 }
233 }
234
235 thread_park_workers(c, thread_count);
236
237 avctx->execute = thread_execute;
238 avctx->execute2 = thread_execute2;
239 return 0;
240}
241
242void ff_thread_report_progress2(AVCodecContext *avctx, int field, int thread, int n)
243{
244 SliceThreadContext *p = avctx->internal->thread_ctx;
245 int *entries = p->entries;
246
247 pthread_mutex_lock(&p->progress_mutex[thread]);
248 entries[field] +=n;
249 pthread_cond_signal(&p->progress_cond[thread]);
250 pthread_mutex_unlock(&p->progress_mutex[thread]);
251}
252
253void ff_thread_await_progress2(AVCodecContext *avctx, int field, int thread, int shift)
254{
255 SliceThreadContext *p = avctx->internal->thread_ctx;
256 int *entries = p->entries;
257
258 if (!entries || !field) return;
259
260 thread = thread ? thread - 1 : p->thread_count - 1;
261
262 pthread_mutex_lock(&p->progress_mutex[thread]);
263 while ((entries[field - 1] - entries[field]) < shift){
264 pthread_cond_wait(&p->progress_cond[thread], &p->progress_mutex[thread]);
265 }
266 pthread_mutex_unlock(&p->progress_mutex[thread]);
267}
268
269int ff_alloc_entries(AVCodecContext *avctx, int count)
270{
271 int i;
272
273 if (avctx->active_thread_type & FF_THREAD_SLICE) {
274 SliceThreadContext *p = avctx->internal->thread_ctx;
275
276 if (p->entries) {
277 av_assert0(p->thread_count == avctx->thread_count);
278 av_freep(&p->entries);
279 }
280
281 p->thread_count = avctx->thread_count;
282 p->entries = av_mallocz_array(count, sizeof(int));
283
284 if (!p->progress_mutex) {
285 p->progress_mutex = av_malloc_array(p->thread_count, sizeof(pthread_mutex_t));
286 p->progress_cond = av_malloc_array(p->thread_count, sizeof(pthread_cond_t));
287 }
288
289 if (!p->entries || !p->progress_mutex || !p->progress_cond) {
290 av_freep(&p->entries);
291 av_freep(&p->progress_mutex);
292 av_freep(&p->progress_cond);
293 return AVERROR(ENOMEM);
294 }
295 p->entries_count = count;
296
297 for (i = 0; i < p->thread_count; i++) {
298 pthread_mutex_init(&p->progress_mutex[i], NULL);
299 pthread_cond_init(&p->progress_cond[i], NULL);
300 }
301 }
302
303 return 0;
304}
305
306void ff_reset_entries(AVCodecContext *avctx)
307{
308 SliceThreadContext *p = avctx->internal->thread_ctx;
309 memset(p->entries, 0, p->entries_count * sizeof(int));
310}
311