annotate libavcodec/h264_ompss.c @ 7:c8259123d224

hide animating VP and entry point
author Nina Engelhardt <nengel@mailbox.tu-berlin.de>
date Wed, 15 May 2013 15:26:14 +0200
parents 55fb61482128
children 6c1433f5a562
rev   line source
nengel@2 1 /*
nengel@2 2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
nengel@2 3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
nengel@2 4 *
nengel@2 5 * This file is part of FFmpeg.
nengel@2 6 *
nengel@2 7 * FFmpeg is free software; you can redistribute it and/or
nengel@2 8 * modify it under the terms of the GNU Lesser General Public
nengel@2 9 * License as published by the Free Software Foundation; either
nengel@2 10 * version 2.1 of the License, or (at your option) any later version.
nengel@2 11 *
nengel@2 12 * FFmpeg is distributed in the hope that it will be useful,
nengel@2 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nengel@2 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
nengel@2 15 * Lesser General Public License for more details.
nengel@2 16 *
nengel@2 17 * You should have received a copy of the GNU Lesser General Public
nengel@2 18 * License along with FFmpeg; if not, write to the Free Software
nengel@2 19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
nengel@2 20 */
nengel@2 21 #include "h264_types.h"
nengel@2 22 #include "h264_parser.h"
nengel@2 23 #include "h264_nal.h"
nengel@2 24 #include "h264_entropy.h"
nengel@2 25 #include "h264_rec.h"
nengel@2 26 #include "h264_pred_mode.h"
nengel@2 27 #include "h264_misc.h"
nengel@2 28 // #undef NDEBUG
nengel@2 29 #include <assert.h>
nengel@3 30 #include "VSs_impl/VSs.h"
nengel@2 31
nengel@3 32 typedef struct{
nengel@3 33 ParserContext *pc;
nengel@3 34 NalContext *nc;
nengel@3 35 SliceBufferEntry *sbe;
nengel@3 36 H264Context *h;
nengel@3 37 } parse_taskArgs;
nengel@3 38
nengel@3 39 int32 parse_taskArgTypes[4] = {INOUT, INOUT, OUTPUT, NONCTLD};
nengel@3 40 int32 parse_taskArgSizes[4] = {sizeof(ParserContext), sizeof(NalContext), sizeof(SliceBufferEntry), sizeof(H264Context)};
nengel@3 41
nengel@3 42 //#pragma omp task inout(*pc, *nc) output(*sbe)
nengel@7 43 static void parse_task(void *_data){
nengel@3 44 parse_taskArgs* args = (parse_taskArgs*) _data;
nengel@3 45 ParserContext *pc = args->pc;
nengel@3 46 NalContext *nc = args->nc;
nengel@3 47 SliceBufferEntry *sbe = args->sbe;
nengel@3 48 H264Context *h = args->h;
nengel@2 49 H264Slice *s;
nengel@2 50
nengel@2 51 if (!sbe->initialized){
nengel@2 52 init_sb_entry(h, sbe);
nengel@2 53 sbe->lines_total=h->mb_height;
nengel@2 54 }
nengel@2 55
nengel@2 56 av_read_frame_internal(pc, &sbe->gb);
nengel@2 57 s = &sbe->slice;
nengel@2 58
nengel@2 59 decode_nal_units(nc, s, &sbe->gb);
nengel@3 60
nengel@7 61 VSs__end_task();
nengel@2 62 }
nengel@2 63
nengel@3 64 VSsTaskType parse_taskType = {
nengel@3 65 .fn = &parse_task,
nengel@3 66 .numCtldArgs = 3,
nengel@3 67 .numTotalArgs = 4,
nengel@3 68 .sizeOfArgs = sizeof(parse_taskArgs),
nengel@3 69 .argTypes = parse_taskArgTypes,
nengel@3 70 .argSizes = parse_taskArgSizes};
nengel@3 71
nengel@3 72
nengel@3 73 typedef struct{
nengel@3 74 EntropyContext *ec;
nengel@3 75 SliceBufferEntry *sbe;
nengel@3 76 H264Context *h;
nengel@3 77 } decode_slice_entropy_taskArgs;
nengel@3 78
nengel@3 79 int32 decode_slice_entropy_taskArgTypes[3] = {INOUT, INOUT, NONCTLD};
nengel@3 80 int32 decode_slice_entropy_taskArgSizes[3] = {sizeof(EntropyContext), sizeof(SliceBufferEntry), sizeof(H264Context)};
nengel@3 81
nengel@3 82 //#pragma omp task inout(*ec) inout(*sbe)
nengel@7 83 static void decode_slice_entropy_task(void *_data){
nengel@3 84 decode_slice_entropy_taskArgs* args = (decode_slice_entropy_taskArgs*) _data;
nengel@3 85 EntropyContext *ec = args->ec;
nengel@3 86 SliceBufferEntry *sbe = args->sbe;
nengel@3 87 H264Context *h = args->h;
nengel@2 88 int i,j;
nengel@2 89 H264Slice *s = &sbe->slice;
nengel@2 90 GetBitContext *gb = &sbe->gb;
nengel@2 91 H264Mb *mbs = sbe->mbs;
nengel@2 92 // GetBitContext *gb = s->gb;
nengel@2 93 CABACContext *c = &ec->c;
nengel@2 94
nengel@2 95 if( !s->pps.cabac ){
nengel@2 96 av_log(AV_LOG_ERROR, "Only cabac encoded streams are supported\n");
nengel@7 97 VSs__end_task();
nengel@2 98 }
nengel@2 99
nengel@2 100 init_dequant_tables(s, ec);
nengel@2 101 ec->curr_qscale = s->qscale;
nengel@2 102 ec->last_qscale_diff = 0;
nengel@2 103 ec->chroma_qp[0] = get_chroma_qp((H264Slice *) s, 0, s->qscale);
nengel@2 104 ec->chroma_qp[1] = get_chroma_qp((H264Slice *) s, 1, s->qscale);
nengel@2 105
nengel@2 106 /* realign */
nengel@2 107 align_get_bits( gb );
nengel@2 108 /* init cabac */
nengel@2 109 ff_init_cabac_decoder( c, gb->buffer + get_bits_count(gb)/8, (get_bits_left(gb) + 7)/8);
nengel@2 110
nengel@2 111 ff_h264_init_cabac_states(ec, s, c);
nengel@2 112
nengel@2 113 for(j=0; j<ec->mb_height; j++){
nengel@2 114 init_entropy_buf(ec, s, j);
nengel@2 115 for(i=0; i<ec->mb_width; i++){
nengel@2 116 int eos,ret;
nengel@2 117 H264Mb *m = &mbs[i + j*ec->mb_width];
nengel@2 118 m->mb_x=i;
nengel@2 119 m->mb_y=j;
nengel@2 120 ec->m = m;
nengel@2 121
nengel@2 122 ret = ff_h264_decode_mb_cabac(ec, s, c);
nengel@2 123 eos = get_cabac_terminate( c);
nengel@2 124 (void) eos;
nengel@2 125 if( ret < 0 || c->bytestream > c->bytestream_end + 2) {
nengel@2 126 av_log(AV_LOG_ERROR, "error while decoding MB %d %d, bytestream (%td)\n", m->mb_x, m->mb_y, c->bytestream_end - c->bytestream);
nengel@7 127 VSs__end_task();
nengel@2 128 }
nengel@2 129 }
nengel@2 130 }
nengel@7 131 VSs__end_task();
nengel@2 132 }
nengel@2 133
nengel@3 134 VSsTaskType decode_slice_entropy_taskType = {
nengel@3 135 .fn = &decode_slice_entropy_task,
nengel@3 136 .numCtldArgs = 2,
nengel@3 137 .numTotalArgs = 3,
nengel@3 138 .sizeOfArgs = sizeof(decode_slice_entropy_taskArgs),
nengel@3 139 .argTypes = decode_slice_entropy_taskArgTypes,
nengel@3 140 .argSizes = decode_slice_entropy_taskArgSizes};
nengel@3 141
nengel@3 142
nengel@2 143 static void decode_super_mb_block(MBRecContext *d, H264Slice *s, SuperMBContext *smbc, H264Mb *mbs, int smb_x, int smb_y){
nengel@2 144 MBRecState mrs;
nengel@2 145 // memset(&mrs, 0, sizeof(MBRecState));
nengel@2 146
nengel@2 147 for (int k=0, i= smb_y; i< smb_y + smbc->smb_height; i++, k++){
nengel@2 148 init_mbrec_context(d, &mrs, s, i);
nengel@2 149 for (int j= smb_x -k ; j< smb_x - k + smbc->smb_width; j++){
nengel@2 150 if (i< d->mb_height && j >= 0 && j < d->mb_width){
nengel@2 151 h264_decode_mb_internal (d, &mrs, s, &mbs[i*d->mb_width+j]);
nengel@2 152 }
nengel@2 153 }
nengel@2 154 }
nengel@2 155 }
nengel@2 156
nengel@3 157 typedef struct{
nengel@3 158 MBRecContext *d;
nengel@3 159 SliceBufferEntry *sbe;
nengel@3 160 SuperMBTask *ml;
nengel@3 161 SuperMBTask *mur;
nengel@3 162 SuperMBTask *m;
nengel@3 163 SuperMBContext *smbc;
nengel@3 164 } decode_super_mb_taskArgs;
nengel@3 165
nengel@3 166 int32 decode_super_mb_taskArgTypes[6] = {IN, IN, IN, IN, INOUT, NONCTLD};
nengel@3 167 int32 decode_super_mb_taskArgSizes[6] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(SuperMBTask), sizeof(SuperMBTask), sizeof(SuperMBTask), sizeof(SuperMBContext)};
nengel@3 168
nengel@3 169 //#pragma omp task input(*d, *sbe, *ml, *mur) inout(*m)
nengel@7 170 static void decode_super_mb_task(void *_data){
nengel@3 171 decode_super_mb_taskArgs* args = (decode_super_mb_taskArgs*) _data;
nengel@3 172 MBRecContext *d = args->d;
nengel@3 173 SliceBufferEntry *sbe = args->sbe;
nengel@3 174 SuperMBTask *ml = args->ml;
nengel@3 175 SuperMBTask *mur = args->mur;
nengel@3 176 SuperMBTask *m = args->m;
nengel@3 177 SuperMBContext *smbc = args->smbc;
nengel@2 178 H264Slice *s = &sbe->slice;
nengel@2 179 H264Mb *mbs = sbe->mbs;
nengel@2 180 decode_super_mb_block(d, s, smbc, mbs, m->smb_x, m->smb_y);
nengel@7 181 VSs__end_task();
nengel@2 182 }
nengel@2 183
nengel@3 184 VSsTaskType decode_super_mb_taskType = {
nengel@3 185 .fn = &decode_super_mb_task,
nengel@3 186 .numCtldArgs = 5,
nengel@3 187 .numTotalArgs = 6,
nengel@3 188 .sizeOfArgs = sizeof(decode_super_mb_taskArgs),
nengel@3 189 .argTypes = decode_super_mb_taskArgTypes,
nengel@3 190 .argSizes = decode_super_mb_taskArgSizes};
nengel@3 191
nengel@3 192
nengel@3 193
nengel@3 194 typedef struct{
nengel@3 195 MBRecContext *d;
nengel@3 196 SliceBufferEntry *sbe;
nengel@3 197 SuperMBTask *sm;
nengel@3 198 SuperMBContext *smbc;
nengel@3 199 int* line;
nengel@3 200 } draw_edges_taskArgs;
nengel@3 201
nengel@3 202 int32 draw_edges_taskArgTypes[5] = {IN, IN, INOUT, NONCTLD, NONCTLD};
nengel@3 203 int32 draw_edges_taskArgSizes[5] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(SuperMBTask),sizeof(SuperMBContext),sizeof(int)};
nengel@3 204
nengel@3 205 //#pragma omp task input(*d, *sbe) inout(*sm)
nengel@7 206 static void draw_edges_task(void *_data){
nengel@3 207 draw_edges_taskArgs* args = (draw_edges_taskArgs*) _data;
nengel@3 208 MBRecContext *d = args->d;
nengel@3 209 SliceBufferEntry *sbe = args->sbe;
nengel@3 210 SuperMBTask *sm = args->sm;
nengel@3 211 SuperMBContext *smbc = args->smbc;
nengel@3 212 int line = *(args->line);
nengel@2 213 H264Slice *s = &sbe->slice;
nengel@2 214 for (int i=line*smbc->smb_height; i< (line+1)*smbc->smb_height && i< d->mb_height; i++)
nengel@2 215 draw_edges(d, s, i);
nengel@6 216 VMS_App__free(args->line);
nengel@7 217 VSs__end_task();
nengel@2 218 }
nengel@3 219 VSsTaskType draw_edges_taskType = {
nengel@3 220 .fn = &draw_edges_task,
nengel@3 221 .numCtldArgs = 3,
nengel@3 222 .numTotalArgs = 5,
nengel@3 223 .sizeOfArgs = sizeof(draw_edges_taskArgs),
nengel@3 224 .argTypes = draw_edges_taskArgTypes,
nengel@3 225 .argSizes = draw_edges_taskArgSizes};
nengel@2 226
nengel@3 227
nengel@7 228 static void decode_mb_in_slice(H264Context *h, MBRecContext *d, SliceBufferEntry *sbe){
nengel@2 229 int i,j;
nengel@2 230
nengel@2 231 SuperMBContext *smbc = acquire_smbc(h);
nengel@2 232 int smb_height =smbc->nsmb_height, smb_width= smbc->nsmb_width;
nengel@2 233 SuperMBTask *smbs = smbc->smbs[0];
nengel@2 234
nengel@2 235 SuperMBTask *sm=NULL, *sml, *smur;
nengel@2 236 for(j=0; j< smb_height; j++){
nengel@2 237 for(i=0; i< smb_width; i++){
nengel@2 238 sm = smbs + j*smb_width + i;
nengel@2 239 sml = sm - ((i > 0) ? 1: 0);
nengel@2 240 smur = sm + (((i < smb_width-1) && (j >0)) ? -smb_width+1: 0);
nengel@3 241 decode_super_mb_taskArgs decode_super_mb_task_args;
nengel@3 242 decode_super_mb_task_args.d = d;
nengel@3 243 decode_super_mb_task_args.sbe = sbe;
nengel@3 244 decode_super_mb_task_args.smbc = smbc;
nengel@3 245 decode_super_mb_task_args.ml = sml;
nengel@3 246 decode_super_mb_task_args.mur = smur;
nengel@3 247 decode_super_mb_task_args.m = sm;
nengel@7 248 VSs__submit_task(&decode_super_mb_taskType, &decode_super_mb_task_args);
nengel@2 249 }
nengel@3 250 draw_edges_taskArgs draw_edges_task_args;
nengel@3 251 draw_edges_task_args.d = d;
nengel@3 252 draw_edges_task_args.sbe = sbe;
nengel@3 253 draw_edges_task_args.sm = sm;
nengel@3 254 draw_edges_task_args.smbc = smbc;
nengel@3 255 draw_edges_task_args.line = VMS_App__malloc( sizeof(int) );
nengel@3 256 *(draw_edges_task_args.line) = j;
nengel@7 257 VSs__submit_task(&draw_edges_taskType, &draw_edges_task_args);
nengel@2 258 }
nengel@7 259 VSs__taskwait_on(sm);
nengel@3 260 //#pragma omp taskwait on(*sm)
nengel@2 261
nengel@2 262 release_smbc(h, smbc);
nengel@2 263 }
nengel@2 264
nengel@3 265 typedef struct{
nengel@3 266 MBRecContext *d;
nengel@3 267 SliceBufferEntry *sbe;
nengel@3 268 H264Context *h;
nengel@3 269 } decode_slice_mb_taskArgs;
nengel@3 270
nengel@3 271 int32 decode_slice_mb_taskArgTypes[3] = {INOUT, INOUT, NONCTLD};
nengel@3 272 int32 decode_slice_mb_taskArgSizes[3] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(H264Context)};
nengel@3 273
nengel@3 274 //#pragma omp task inout(*d) inout(*sbe)
nengel@7 275 static void decode_slice_mb_task(void *_data){
nengel@3 276 decode_slice_mb_taskArgs* args = (decode_slice_mb_taskArgs*) _data;
nengel@3 277 MBRecContext *d = args->d;
nengel@3 278 SliceBufferEntry *sbe = args->sbe;
nengel@3 279 H264Context *h = args->h;
nengel@3 280
nengel@2 281 H264Slice *s = &sbe->slice;
nengel@2 282
nengel@2 283 for (int i=0; i<2; i++){
nengel@2 284 for(int j=0; j< s->ref_count[i]; j++){
nengel@2 285 if (s->ref_list_cpn[i][j] ==-1)
nengel@2 286 continue;
nengel@2 287 int k;
nengel@2 288 for (k=0; k< h->max_dpb_cnt; k++){
nengel@2 289 if(h->dpb[k].reference >= 2 && h->dpb[k].cpn == s->ref_list_cpn[i][j]){
nengel@2 290 s->dp_ref_list[i][j] = &h->dpb[k];
nengel@2 291 break;
nengel@2 292 }
nengel@2 293 }
nengel@2 294 }
nengel@2 295 }
nengel@2 296
nengel@3 297 //#pragma omp critical (dpb)
nengel@7 298 VSs__start_critical(0);
nengel@2 299 get_dpb_entry(h, s);
nengel@7 300 VSs__end_critical(0);
nengel@3 301
nengel@2 302 if (!h->no_mbd){
nengel@7 303 decode_mb_in_slice (h, d, sbe);
nengel@2 304 }
nengel@2 305
nengel@2 306 for (int i=0; i<s->release_cnt; i++){
nengel@2 307 for(int j=0; j<h->max_dpb_cnt; j++){
nengel@2 308 if(h->dpb[j].cpn== s->release_ref_cpn[i]){
nengel@3 309 //#pragma omp critical (dpb)
nengel@7 310 VSs__start_critical(0);
nengel@2 311 release_dpb_entry(h, &h->dpb[j], 2);
nengel@7 312 VSs__end_critical(0);
nengel@2 313 break;
nengel@2 314 }
nengel@2 315 }
nengel@2 316 }
nengel@2 317 s->release_cnt=0;
nengel@7 318 VSs__end_task();
nengel@2 319 }
nengel@2 320
nengel@3 321 VSsTaskType decode_slice_mb_taskType = {
nengel@3 322 .fn = &decode_slice_mb_task,
nengel@3 323 .numCtldArgs = 2,
nengel@3 324 .numTotalArgs = 3,
nengel@3 325 .sizeOfArgs = sizeof(decode_slice_mb_taskArgs),
nengel@3 326 .argTypes = decode_slice_mb_taskArgTypes,
nengel@3 327 .argSizes = decode_slice_mb_taskArgSizes};
nengel@3 328
nengel@2 329 // for static 3d wave
nengel@2 330 /*-------------------------------------------------------------------------------*/
nengel@3 331 typedef struct{
nengel@3 332 MBRecContext *d;
nengel@3 333 SliceBufferEntry *sbe;
nengel@3 334 SuperMBTask *ml;
nengel@3 335 SuperMBTask *mur;
nengel@3 336 SuperMBTask *mprev;
nengel@3 337 SuperMBTask *m;
nengel@3 338 SuperMBContext *smbc;
nengel@3 339 } decode_3dwave_super_mb_taskArgs;
nengel@3 340
nengel@3 341 int32 decode_3dwave_super_mb_taskArgTypes[7] = {IN, IN, IN, IN, IN, INOUT, NONCTLD};
nengel@3 342 int32 decode_3dwave_super_mb_taskArgSizes[7] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(SuperMBTask),
nengel@3 343 sizeof(SuperMBTask), sizeof(SuperMBTask), sizeof(SuperMBTask), sizeof(SuperMBContext)};
nengel@3 344
nengel@3 345 //#pragma omp task input(*d, *sbe, *ml, *mur, *mprev) inout(*m)
nengel@7 346 static void decode_3dwave_super_mb_task(void *_data){
nengel@3 347 decode_3dwave_super_mb_taskArgs* args = (decode_3dwave_super_mb_taskArgs*) _data;
nengel@3 348 MBRecContext *d = args->d;
nengel@3 349 SliceBufferEntry *sbe = args->sbe;
nengel@3 350 SuperMBTask *ml = args->ml;
nengel@3 351 SuperMBTask *mur = args->mur;
nengel@3 352 SuperMBTask *mprev = args->mprev;
nengel@3 353 SuperMBTask *m = args->m;
nengel@3 354 SuperMBContext *smbc = args->smbc;
nengel@3 355
nengel@2 356 H264Slice *s = &sbe->slice;
nengel@2 357 H264Mb *mbs = sbe->mbs;
nengel@2 358
nengel@2 359 decode_super_mb_block(d, s, smbc, mbs, m->smb_x, m->smb_y);
nengel@7 360 VSs__end_task();
nengel@2 361 }
nengel@2 362
nengel@3 363 VSsTaskType decode_3dwave_super_mb_taskType = {
nengel@3 364 .fn = &decode_3dwave_super_mb_task,
nengel@3 365 .numCtldArgs = 6,
nengel@3 366 .numTotalArgs = 7,
nengel@3 367 .sizeOfArgs = sizeof(decode_3dwave_super_mb_taskArgs),
nengel@3 368 .argTypes = decode_3dwave_super_mb_taskArgTypes,
nengel@3 369 .argSizes = decode_3dwave_super_mb_taskArgSizes};
nengel@3 370
nengel@2 371 // int init_ref_count=0;
nengel@3 372 typedef struct{
nengel@3 373 MBRecContext *d;
nengel@3 374 SliceBufferEntry *sbe;
nengel@3 375 int* init;
nengel@3 376 H264Context *h;
nengel@3 377 } init_ref_list_and_get_dpb_taskArgs;
nengel@3 378
nengel@3 379 int32 init_ref_list_and_get_dpb_taskArgTypes[4] = {INOUT, INOUT, INOUT, NONCTLD};
nengel@3 380 int32 init_ref_list_and_get_dpb_taskArgSizes[4] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(int), sizeof(H264Context)};
nengel@3 381
nengel@3 382 //#pragma omp task inout(*d, *sbe, *init)
nengel@7 383 static void init_ref_list_and_get_dpb_task(void *_data){
nengel@3 384 init_ref_list_and_get_dpb_taskArgs* args = (init_ref_list_and_get_dpb_taskArgs*) _data;
nengel@3 385 MBRecContext *d = args->d;
nengel@3 386 SliceBufferEntry *sbe = args->sbe;
nengel@3 387 int* initp = args->init;
nengel@3 388 H264Context *h = args->h;
nengel@3 389
nengel@2 390 H264Slice *s = &sbe->slice;
nengel@2 391 for (int i=0; i<2; i++){
nengel@2 392 for(int j=0; j< s->ref_count[i]; j++){
nengel@2 393 if (s->ref_list_cpn[i][j] ==-1)
nengel@2 394 continue;
nengel@2 395 int k;
nengel@2 396 for (k=0; k<h->max_dpb_cnt; k++){
nengel@2 397 if(h->dpb[k].reference >= 2 && h->dpb[k].cpn == s->ref_list_cpn[i][j]){
nengel@2 398 s->dp_ref_list[i][j] = &h->dpb[k];
nengel@2 399 break;
nengel@2 400 }
nengel@2 401 }
nengel@2 402 }
nengel@2 403 }
nengel@2 404
nengel@3 405 //#pragma omp critical (dpb)
nengel@7 406 VSs__start_critical(0);
nengel@2 407 get_dpb_entry(h, s);
nengel@7 408 VSs__end_critical(0);
nengel@3 409
nengel@7 410 VSs__end_task();
nengel@2 411 }
nengel@2 412
nengel@3 413 VSsTaskType init_ref_list_and_get_dpb_taskType = {
nengel@3 414 .fn = &init_ref_list_and_get_dpb_task,
nengel@3 415 .numCtldArgs = 3,
nengel@3 416 .numTotalArgs = 4,
nengel@3 417 .sizeOfArgs = sizeof(init_ref_list_and_get_dpb_taskArgs),
nengel@3 418 .argTypes = init_ref_list_and_get_dpb_taskArgTypes,
nengel@3 419 .argSizes = init_ref_list_and_get_dpb_taskArgSizes};
nengel@3 420
nengel@7 421 static SuperMBTask* add_decode_slice_3dwave_tasks(MBRecContext *d, SliceBufferEntry *sbe, SuperMBContext *smbc, int k){
nengel@2 422 int i,j;
nengel@2 423
nengel@5 424 int32* taskID;
nengel@5 425
nengel@2 426 int smb_3d_height =smbc->nsmb_3dheight;
nengel@2 427 int smb_height =smbc->nsmb_height, smb_width= smbc->nsmb_width;
nengel@2 428 int smb_diff_prev = smb_height - smb_3d_height;
nengel@2 429 SuperMBTask *sm=NULL, *sml, *smur, *smprev;
nengel@2 430
nengel@2 431 SuperMBTask *smbs = smbc->smbs[smbc->index++]; smbc->index%=2;
nengel@2 432 SuperMBTask *smbs_prev = smbc->smbs[smbc->index]; // index rotates -> next == prev
nengel@2 433
nengel@2 434 for(j=0; j<smb_3d_height ; j++){
nengel@2 435 for(i=0; i< smb_width; i++){
nengel@2 436 sm = smbs + j*smb_width + i;
nengel@2 437 sml = sm - ((i > 0) ? 1: 0);
nengel@2 438 smur = sm + (((i < smb_width-1) && (j >0)) ? -smb_width+1: 0);
nengel@2 439 smprev = smbs_prev + (j + smb_diff_prev+1)*smb_width -1;
nengel@3 440 decode_3dwave_super_mb_taskArgs decode_3dwave_super_mb_task_args;
nengel@3 441 decode_3dwave_super_mb_task_args.d = d;
nengel@3 442 decode_3dwave_super_mb_task_args.sbe = sbe;
nengel@3 443 decode_3dwave_super_mb_task_args.smbc = smbc;
nengel@3 444 decode_3dwave_super_mb_task_args.ml = sml;
nengel@3 445 decode_3dwave_super_mb_task_args.mur = smur;
nengel@3 446 decode_3dwave_super_mb_task_args.mprev = smprev;
nengel@3 447 decode_3dwave_super_mb_task_args.m = sm;
nengel@7 448 taskID = VSs__create_taskID_of_size(3 );
nengel@5 449 taskID[1] = k;
nengel@5 450 taskID[2] = j;
nengel@5 451 taskID[3] = i;
nengel@7 452 VSs__submit_task_with_ID(&decode_3dwave_super_mb_taskType, &decode_3dwave_super_mb_task_args, taskID);
nengel@2 453 }
nengel@3 454 draw_edges_taskArgs draw_edges_task_args;
nengel@3 455 draw_edges_task_args.d = d;
nengel@3 456 draw_edges_task_args.sbe = sbe;
nengel@3 457 draw_edges_task_args.sm = sm;
nengel@3 458 draw_edges_task_args.smbc = smbc;
nengel@3 459 draw_edges_task_args.line = VMS_App__malloc( sizeof(int) );
nengel@3 460 *(draw_edges_task_args.line) = j;
nengel@7 461 taskID = VSs__create_taskID_of_size(3);
nengel@5 462 taskID[1] = k;
nengel@5 463 taskID[2] = j;
nengel@5 464 taskID[3] = i;
nengel@7 465 VSs__submit_task_with_ID(&draw_edges_taskType, &draw_edges_task_args, taskID);
nengel@2 466 }
nengel@2 467
nengel@2 468 for(; j< smb_height; j++){
nengel@2 469 for(i=0; i< smb_width; i++){
nengel@2 470 sm = smbs + j*smb_width + i;
nengel@2 471 sml = sm - ((i > 0) ? 1: 0);
nengel@2 472 smur = sm + (((i < smb_width-1) && (j >0)) ? -smb_width+1: 0);
nengel@3 473 decode_super_mb_taskArgs decode_super_mb_task_args;
nengel@3 474 decode_super_mb_task_args.d = d;
nengel@3 475 decode_super_mb_task_args.sbe = sbe;
nengel@3 476 decode_super_mb_task_args.smbc = smbc;
nengel@3 477 decode_super_mb_task_args.ml = sml;
nengel@3 478 decode_super_mb_task_args.mur = smur;
nengel@3 479 decode_super_mb_task_args.m = sm;
nengel@7 480 taskID = VSs__create_taskID_of_size(3 );
nengel@5 481 taskID[1] = k;
nengel@5 482 taskID[2] = j;
nengel@5 483 taskID[3] = i;
nengel@7 484 VSs__submit_task_with_ID(&decode_super_mb_taskType, &decode_super_mb_task_args, taskID);
nengel@2 485 }
nengel@3 486 draw_edges_taskArgs draw_edges_task_args;
nengel@3 487 draw_edges_task_args.d = d;
nengel@3 488 draw_edges_task_args.sbe = sbe;
nengel@3 489 draw_edges_task_args.sm = sm;
nengel@3 490 draw_edges_task_args.smbc = smbc;
nengel@3 491 draw_edges_task_args.line = VMS_App__malloc( sizeof(int) );
nengel@3 492 *(draw_edges_task_args.line) = j;
nengel@7 493 taskID = VSs__create_taskID_of_size(3);
nengel@5 494 taskID[1] = k;
nengel@5 495 taskID[2] = j;
nengel@5 496 taskID[3] = i;
nengel@7 497 VSs__submit_task_with_ID(&draw_edges_taskType, &draw_edges_task_args, taskID);
nengel@2 498 }
nengel@2 499 return sm;
nengel@2 500 }
nengel@2 501
nengel@3 502 typedef struct{
nengel@3 503 MBRecContext *d;
nengel@3 504 SliceBufferEntry *sbe;
nengel@3 505 SuperMBTask *lastsmb;
nengel@3 506 int* release;
nengel@3 507 H264Context *h;
nengel@3 508 SuperMBContext *smbc;
nengel@3 509 } release_ref_list_taskArgs;
nengel@3 510
nengel@3 511 int32 release_ref_list_taskArgTypes[6] = {INOUT, INOUT, IN, INOUT, NONCTLD, NONCTLD};
nengel@3 512 int32 release_ref_list_taskArgSizes[6] = {sizeof(MBRecContext), sizeof(SliceBufferEntry), sizeof(SuperMBTask), sizeof(int), sizeof(H264Context), sizeof(SuperMBContext)};
nengel@3 513
nengel@3 514 //#pragma omp task inout(*d, *sbe, *release) input (*lastsmb)
nengel@7 515 static void release_ref_list_task(void *_data){
nengel@3 516 release_ref_list_taskArgs* args = (release_ref_list_taskArgs*) _data;
nengel@3 517 MBRecContext *d = args->d;
nengel@3 518 SliceBufferEntry *sbe = args->sbe;
nengel@3 519 SuperMBTask *lastsmb = args->lastsmb;
nengel@3 520 int* releasep = args->release;
nengel@3 521 H264Context *h = args->h;
nengel@3 522 SuperMBContext *smbc = args->smbc;
nengel@3 523
nengel@2 524 H264Slice *s = &sbe->slice;
nengel@2 525 for (int i=0; i<s->release_cnt; i++){
nengel@2 526 for(int j=0; j<h->max_dpb_cnt; j++){
nengel@2 527 if(h->dpb[j].cpn== s->release_ref_cpn[i]){
nengel@3 528 //#pragma omp critical (dpb)
nengel@7 529 VSs__start_critical(0);
nengel@2 530 release_dpb_entry(h, &h->dpb[j], 2);
nengel@7 531 VSs__end_critical(0);
nengel@2 532 break;
nengel@2 533 }
nengel@2 534 }
nengel@2 535 }
nengel@2 536 s->release_cnt=0;
nengel@2 537
nengel@2 538 release_smbc(h, smbc);
nengel@2 539
nengel@7 540 VSs__end_task();
nengel@2 541 }
nengel@2 542
nengel@3 543 VSsTaskType release_ref_list_taskType = {
nengel@3 544 .fn = &release_ref_list_task,
nengel@3 545 .numCtldArgs = 4,
nengel@3 546 .numTotalArgs = 6,
nengel@3 547 .sizeOfArgs = sizeof(release_ref_list_taskArgs),
nengel@3 548 .argTypes = release_ref_list_taskArgTypes,
nengel@3 549 .argSizes = release_ref_list_taskArgSizes};
nengel@3 550
nengel@2 551 // static void decode_mb_static_3dwave(H264Context *h, int mb_height, int mb_width, MBRecContext *d, H264Slice *s, H264Mb *mbs, SuperMBTask *smbs, SuperMBTask *smbs_prev){
nengel@2 552 //
nengel@2 553 // }
nengel@2 554 /*-------------------------------------------------------------------------------*/
nengel@2 555 //end for static 3d wave
nengel@2 556
nengel@3 557 typedef struct{
nengel@3 558 OutputContext *oc;
nengel@3 559 SliceBufferEntry *sbe;
nengel@3 560 H264Context *h;
nengel@3 561 } output_taskArgs;
nengel@3 562
nengel@3 563 int32 output_taskArgTypes[3] = {INOUT, IN, NONCTLD};
nengel@3 564 int32 output_taskArgSizes[3] = {sizeof(OutputContext), sizeof(SliceBufferEntry), sizeof(H264Context)};
nengel@3 565
nengel@3 566 //#pragma omp task inout (*oc) input(*sbe)
nengel@7 567 static void output_task(void *_data){
nengel@3 568 output_taskArgs* args = (output_taskArgs*) _data;
nengel@3 569 OutputContext *oc = args->oc;
nengel@3 570 SliceBufferEntry *sbe = args->sbe;
nengel@3 571 H264Context *h = args->h;
nengel@3 572
nengel@2 573 DecodedPicture* out =output_frame(h, oc, sbe->slice.curr_pic, h->ofile, h->frame_width, h->frame_height);
nengel@2 574 if (out){
nengel@3 575 //#pragma omp critical (dpb)
nengel@7 576 VSs__start_critical(0);
nengel@2 577 release_dpb_entry(h, out, 1);
nengel@7 578 VSs__end_critical(0);
nengel@2 579 }
nengel@6 580 //print_report(oc->frame_number, oc->video_size, 0, h->verbose);
nengel@3 581
nengel@7 582 VSs__end_task();
nengel@2 583 }
nengel@2 584
nengel@3 585 VSsTaskType output_taskType = {
nengel@3 586 .fn = &output_task,
nengel@3 587 .numCtldArgs = 2,
nengel@3 588 .numTotalArgs = 3,
nengel@3 589 .sizeOfArgs = sizeof(output_taskArgs),
nengel@3 590 .argTypes = output_taskArgTypes,
nengel@3 591 .argSizes = output_taskArgSizes};
nengel@3 592
nengel@2 593 /*
nengel@2 594 * The following code is the main loop of the file converter
nengel@2 595 */
nengel@3 596
nengel@7 597 int h264_decode_ompss( H264Context *h) {
nengel@3 598
nengel@2 599 const int bufs = h->pipe_bufs;
nengel@2 600
nengel@2 601 ParserContext *pc;
nengel@2 602 NalContext *nc;
nengel@2 603 EntropyContext *ec[bufs];
nengel@2 604 MBRecContext *rc[2];
nengel@2 605 OutputContext *oc;
nengel@2 606 SliceBufferEntry *sbe;
nengel@2 607 SuperMBContext *smbc;
nengel@2 608
nengel@2 609 DecodedPicture *out;
nengel@2 610 int frames=0;
nengel@4 611
nengel@4 612 int32* taskID;
nengel@2 613
nengel@2 614 #if HAVE_LIBSDL2
nengel@2 615 pthread_t sdl_thr;
nengel@2 616 if (h->display){
nengel@2 617 pthread_create(&sdl_thr, NULL, sdl_thread, h);
nengel@2 618 }
nengel@2 619 #endif
nengel@3 620 /*sbe= VMS_WL__malloc(sizeof(SliceBufferEntry) * bufs);
nengel@3 621 if (sbe)
nengel@3 622 memset(sbe, 0, sizeof(SliceBufferEntry) * bufs);*/
nengel@2 623 sbe= av_mallocz(sizeof(SliceBufferEntry) * bufs);
nengel@2 624
nengel@2 625 pc = get_parse_context(h->ifile);
nengel@2 626 nc = get_nal_context(h->width, h->height);
nengel@2 627
nengel@2 628 for(int i=0; i<bufs; i++){
nengel@2 629 ec[i] = get_entropy_context( h );
nengel@2 630 }
nengel@2 631
nengel@2 632 for(int i=0; i<2; i++){
nengel@2 633 rc[i] = get_mbrec_context(h);
nengel@2 634 }
nengel@2 635
nengel@2 636 oc = get_output_context( h );
nengel@2 637
nengel@2 638 av_start_timer();
nengel@2 639 int k=0; int init, release;
nengel@2 640 if (h->static_3d && bufs < h->num_frames ){
nengel@2 641 int num_pre_ed =0;
nengel@2 642 for (num_pre_ed=0; num_pre_ed< bufs -1 && !pc->final_frame; num_pre_ed++){
nengel@3 643 parse_taskArgs parse_task_args;
nengel@3 644 parse_task_args.h = h;
nengel@3 645 parse_task_args.pc = pc;
nengel@3 646 parse_task_args.nc = nc;
nengel@3 647 parse_task_args.sbe = &sbe[k%bufs];
nengel@7 648 taskID = VSs__create_taskID_of_size(2);
nengel@4 649 taskID[1] = 1;
nengel@5 650 taskID[2] = k;
nengel@7 651 VSs__submit_task_with_ID(&parse_taskType, &parse_task_args, taskID);
nengel@3 652
nengel@3 653 decode_slice_entropy_taskArgs decode_slice_entropy_task_args;
nengel@3 654 decode_slice_entropy_task_args.h = h;
nengel@3 655 decode_slice_entropy_task_args.ec = ec[k%bufs];
nengel@3 656 decode_slice_entropy_task_args.sbe = &sbe[k%bufs];
nengel@7 657 taskID = VSs__create_taskID_of_size(2);
nengel@4 658 taskID[1] = 2;
nengel@5 659 taskID[2] = k;
nengel@7 660 VSs__submit_task_with_ID(&decode_slice_entropy_taskType, &decode_slice_entropy_task_args, taskID);
nengel@3 661 //#pragma omp taskwait on(*pc)
nengel@7 662 VSs__taskwait_on(pc);
nengel@2 663 k++;
nengel@2 664 }
nengel@2 665
nengel@2 666 while(!pc->final_frame && frames++ < h->num_frames && !h->quit){
nengel@3 667 parse_taskArgs parse_task_args;
nengel@3 668 parse_task_args.h = h;
nengel@3 669 parse_task_args.pc = pc;
nengel@3 670 parse_task_args.nc = nc;
nengel@3 671 parse_task_args.sbe = &sbe[k%bufs];
nengel@7 672 taskID = VSs__create_taskID_of_size(2);
nengel@4 673 taskID[1] = 3;
nengel@5 674 taskID[2] = k;
nengel@7 675 VSs__submit_task_with_ID(&parse_taskType, &parse_task_args, taskID);
nengel@3 676
nengel@3 677 decode_slice_entropy_taskArgs decode_slice_entropy_task_args;
nengel@3 678 decode_slice_entropy_task_args.h = h;
nengel@3 679 decode_slice_entropy_task_args.ec = ec[k%bufs];
nengel@3 680 decode_slice_entropy_task_args.sbe = &sbe[k%bufs];
nengel@7 681 taskID = VSs__create_taskID_of_size(2);
nengel@4 682 taskID[1] = 4;
nengel@5 683 taskID[2] = k;
nengel@7 684 VSs__submit_task_with_ID(&decode_slice_entropy_taskType, &decode_slice_entropy_task_args, taskID);
nengel@2 685
nengel@2 686 k++;
nengel@3 687
nengel@3 688 init_ref_list_and_get_dpb_taskArgs init_ref_list_and_get_dpb_task_args;
nengel@3 689 init_ref_list_and_get_dpb_task_args.h = h;
nengel@3 690 init_ref_list_and_get_dpb_task_args.d = rc[k%2];
nengel@3 691 init_ref_list_and_get_dpb_task_args.sbe = &sbe[k%bufs];
nengel@3 692 init_ref_list_and_get_dpb_task_args.init = &init;
nengel@7 693 taskID = VSs__create_taskID_of_size(2);
nengel@4 694 taskID[1] = 5;
nengel@5 695 taskID[2] = k;
nengel@7 696 VSs__submit_task_with_ID(&init_ref_list_and_get_dpb_taskType, &init_ref_list_and_get_dpb_task_args, taskID);
nengel@2 697
nengel@2 698 smbc = acquire_smbc(h);
nengel@7 699 SuperMBTask *lastsmb= add_decode_slice_3dwave_tasks(rc[k%2], &sbe[k%bufs], smbc, k);
nengel@3 700 release_ref_list_taskArgs release_ref_list_task_args;
nengel@3 701 release_ref_list_task_args.h = h;
nengel@3 702 release_ref_list_task_args.smbc = smbc;
nengel@3 703 release_ref_list_task_args.d = rc[k%2];
nengel@3 704 release_ref_list_task_args.sbe = &sbe[k%bufs];
nengel@3 705 release_ref_list_task_args.lastsmb = lastsmb;
nengel@3 706 release_ref_list_task_args.release = &release;
nengel@7 707 taskID = VSs__create_taskID_of_size(2);
nengel@4 708 taskID[1] = 6;
nengel@5 709 taskID[2] = k;
nengel@7 710 VSs__submit_task_with_ID(&release_ref_list_taskType, &release_ref_list_task_args, taskID);
nengel@2 711
nengel@3 712 output_taskArgs output_task_args;
nengel@3 713 output_task_args.h = h;
nengel@3 714 output_task_args.oc = oc;
nengel@3 715 output_task_args.sbe = &sbe[k%bufs];
nengel@7 716 taskID = VSs__create_taskID_of_size(2);
nengel@4 717 taskID[1] = 7;
nengel@5 718 taskID[2] = k;
nengel@7 719 VSs__submit_task_with_ID(&output_taskType, &output_task_args, taskID);
nengel@3 720 //#pragma omp taskwait on(*pc)
nengel@7 721 VSs__taskwait_on(pc);
nengel@2 722 }
nengel@2 723
nengel@2 724 for (int i=0; i< num_pre_ed; i++){
nengel@2 725 k++;
nengel@3 726 init_ref_list_and_get_dpb_taskArgs init_ref_list_and_get_dpb_task_args;
nengel@3 727 init_ref_list_and_get_dpb_task_args.h = h;
nengel@3 728 init_ref_list_and_get_dpb_task_args.d = rc[k%2];
nengel@3 729 init_ref_list_and_get_dpb_task_args.sbe = &sbe[k%bufs];
nengel@3 730 init_ref_list_and_get_dpb_task_args.init = &init;
nengel@7 731 taskID = VSs__create_taskID_of_size(2);
nengel@4 732 taskID[1] = 8;
nengel@4 733 taskID[2] = i;
nengel@7 734 VSs__submit_task_with_ID(&init_ref_list_and_get_dpb_taskType, &init_ref_list_and_get_dpb_task_args, taskID);
nengel@2 735 smbc = acquire_smbc(h);
nengel@7 736 SuperMBTask *lastsmb= add_decode_slice_3dwave_tasks(rc[k%2], &sbe[k%bufs], smbc, k);
nengel@3 737 release_ref_list_taskArgs release_ref_list_task_args;
nengel@3 738 release_ref_list_task_args.h = h;
nengel@3 739 release_ref_list_task_args.smbc = smbc;
nengel@3 740 release_ref_list_task_args.d = rc[k%2];
nengel@3 741 release_ref_list_task_args.sbe = &sbe[k%bufs];
nengel@3 742 release_ref_list_task_args.lastsmb = lastsmb;
nengel@3 743 release_ref_list_task_args.release = &release;
nengel@7 744 taskID = VSs__create_taskID_of_size(2);
nengel@4 745 taskID[1] = 9;
nengel@5 746 taskID[2] = k;
nengel@7 747 VSs__submit_task_with_ID(&release_ref_list_taskType, &release_ref_list_task_args, taskID);
nengel@2 748
nengel@3 749 output_taskArgs output_task_args;
nengel@3 750 output_task_args.h = h;
nengel@3 751 output_task_args.oc = oc;
nengel@3 752 output_task_args.sbe = &sbe[k%bufs];
nengel@7 753 taskID = VSs__create_taskID_of_size(2);
nengel@4 754 taskID[1] = 10;
nengel@5 755 taskID[2] = k;
nengel@7 756 VSs__submit_task_with_ID(&output_taskType, &output_task_args, taskID);
nengel@2 757 }
nengel@2 758
nengel@2 759 } else {
nengel@2 760 while(!pc->final_frame && frames++ < h->num_frames && !h->quit){
nengel@4 761
nengel@7 762 taskID = VSs__create_taskID_of_size(1);
nengel@3 763 taskID[1] = frames*10+1;
nengel@3 764 parse_taskArgs parse_task_args;
nengel@3 765 parse_task_args.h = h;
nengel@3 766 parse_task_args.pc = pc;
nengel@3 767 parse_task_args.nc = nc;
nengel@3 768 parse_task_args.sbe = &sbe[k%bufs];
nengel@7 769 VSs__submit_task_with_ID(&parse_taskType, &parse_task_args, taskID);
nengel@2 770
nengel@7 771 taskID = VSs__create_taskID_of_size(1);
nengel@3 772 taskID[1] = frames*10+2;
nengel@3 773 decode_slice_entropy_taskArgs decode_slice_entropy_task_args;
nengel@3 774 decode_slice_entropy_task_args.h = h;
nengel@3 775 decode_slice_entropy_task_args.ec = ec[k%bufs];
nengel@3 776 decode_slice_entropy_task_args.sbe = &sbe[k%bufs];
nengel@7 777 VSs__submit_task_with_ID(&decode_slice_entropy_taskType, &decode_slice_entropy_task_args,taskID);
nengel@2 778
nengel@7 779 taskID = VSs__create_taskID_of_size(1);
nengel@3 780 taskID[1] = frames*10+3;
nengel@3 781 decode_slice_mb_taskArgs decode_slice_mb_task_args;
nengel@3 782 decode_slice_mb_task_args.h = h;
nengel@3 783 decode_slice_mb_task_args.d = rc[0];
nengel@3 784 decode_slice_mb_task_args.sbe = &sbe[k%bufs];
nengel@7 785 VSs__submit_task_with_ID(&decode_slice_mb_taskType, &decode_slice_mb_task_args,taskID);
nengel@2 786
nengel@7 787 taskID = VSs__create_taskID_of_size(1);
nengel@3 788 taskID[1] = frames*10+4;
nengel@3 789 output_taskArgs output_task_args;
nengel@3 790 output_task_args.h = h;
nengel@3 791 output_task_args.oc = oc;
nengel@3 792 output_task_args.sbe = &sbe[k%bufs];
nengel@7 793 VSs__submit_task_with_ID(&output_taskType, &output_task_args,taskID);
nengel@3 794 //#pragma omp taskwait on(*pc)
nengel@7 795 VSs__taskwait_on(pc);
nengel@2 796 k++;
nengel@2 797 }
nengel@2 798 }
nengel@3 799 //#pragma omp taskwait
nengel@7 800 VSs__taskwait();
nengel@3 801
nengel@2 802 while ((out=output_frame(h, oc, NULL, h->ofile, h->frame_width, h->frame_height))) ;
nengel@2 803
nengel@6 804 //print_report(oc->frame_number, oc->video_size, 1, h->verbose);
nengel@2 805 h->num_frames = oc->frame_number;
nengel@2 806 /* finished ! */
nengel@2 807
nengel@2 808 free_parse_context(pc);
nengel@2 809 free_nal_context (nc);
nengel@2 810 free_output_context(oc);
nengel@2 811 for (int i=0; i<bufs; i++){
nengel@2 812 free_sb_entry(&sbe[i]);
nengel@2 813 free_entropy_context(ec[i]);
nengel@2 814 }
nengel@2 815 av_free(sbe);
nengel@2 816
nengel@2 817 for (int i=0; i<2; i++){
nengel@2 818 free_mbrec_context(rc[i]);
nengel@2 819 }
nengel@2 820
nengel@2 821 #if HAVE_LIBSDL2
nengel@2 822 if (h->display){
nengel@2 823 signal_sdl_exit(h);
nengel@2 824 pthread_join(sdl_thr, NULL);
nengel@2 825 }
nengel@2 826 #endif
nengel@2 827
nengel@7 828 return 0;
nengel@2 829 }