/* * H.265 video codec. * Copyright (c) 2013-2014 struktur AG, Dirk Farin * * This file is part of libde265. * * libde265 is free software: you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as * published by the Free Software Foundation, either version 3 of * the License, or (at your option) any later version. * * libde265 is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public License * along with libde265. If not, see . */ #include "decctx.h" #include "util.h" #include "sao.h" #include "sei.h" #include "deblock.h" #include #include #include #include #include #include "fallback.h" #ifdef HAVE_CONFIG_H #include "config.h" #endif #ifdef HAVE_SSE4_1 #include "x86/sse.h" #endif #ifdef HAVE_ARM #include "arm/arm.h" #endif #define SAVE_INTERMEDIATE_IMAGES 0 #if SAVE_INTERMEDIATE_IMAGES #include "visualize.h" #endif extern void thread_decode_CTB_row(void* d); extern void thread_decode_slice_segment(void* d); thread_context::thread_context() { /* CtbAddrInRS = 0; CtbAddrInTS = 0; CtbX = 0; CtbY = 0; */ /* refIdx[0] = refIdx[1] = 0; mvd[0][0] = mvd[0][1] = mvd[1][0] = mvd[1][1] = 0; merge_flag = 0; merge_idx = 0; mvp_lX_flag[0] = mvp_lX_flag[1] = 0; inter_pred_idc = 0; */ /* enum IntraPredMode IntraPredModeC; // chroma intra-prediction mode for current CB */ /* cu_transquant_bypass_flag = false; memset(transform_skip_flag,0, 3*sizeof(uint8_t)); */ //memset(coeffList,0,sizeof(int16_t)*3*32*32); //memset(coeffPos,0,sizeof(int16_t)*3*32*32); //memset(nCoeff,0,sizeof(int16_t)*3); IsCuQpDeltaCoded = false; CuQpDelta = 0; IsCuChromaQpOffsetCoded = false; CuQpOffsetCb = 0; CuQpOffsetCr = 0; /* currentQPY = 0; currentQG_x = 0; currentQG_y = 0; lastQPYinPreviousQG = 0; */ /* qPYPrime = 0; qPCbPrime = 0; qPCrPrime = 0; */ /* memset(&cabac_decoder, 0, sizeof(CABAC_decoder)); memset(&ctx_model, 0, sizeof(ctx_model)); */ decctx = NULL; img = NULL; shdr = NULL; imgunit = NULL; sliceunit = NULL; //memset(this,0,sizeof(thread_context)); // There is a interesting issue here. When aligning _coeffBuf to 16 bytes offset with // __attribute__((align(16))), the following statement is optimized away since the // compiler assumes that the pointer would be 16-byte aligned. However, this is not the // case when the structure has been dynamically allocated. In this case, the base can // also be at 8 byte offsets (at least with MingW,32 bit). int offset = ((uintptr_t)_coeffBuf) & 0xf; if (offset == 0) { coeffBuf = _coeffBuf; // correctly aligned already } else { coeffBuf = (int16_t *) (((uint8_t *)_coeffBuf) + (16-offset)); } memset(coeffBuf, 0, 32*32*sizeof(int16_t)); } slice_unit::slice_unit(decoder_context* decctx) : nal(NULL), shdr(NULL), imgunit(NULL), flush_reorder_buffer(false), nThreads(0), first_decoded_CTB_RS(-1), last_decoded_CTB_RS(-1), thread_contexts(NULL), ctx(decctx) { state = Unprocessed; nThreadContexts = 0; } slice_unit::~slice_unit() { ctx->nal_parser.free_NAL_unit(nal); if (thread_contexts) { delete[] thread_contexts; } } void slice_unit::allocate_thread_contexts(int n) { assert(thread_contexts==NULL); thread_contexts = new thread_context[n]; nThreadContexts = n; } image_unit::image_unit() { img=NULL; role=Invalid; state=Unprocessed; } image_unit::~image_unit() { for (int i=0;iFirstAfterEndOfSequenceNAL = true; //ctx->last_RAP_picture_NAL_type = NAL_UNIT_UNDEFINED; //de265_init_image(&ctx->coeff); // --- decoded picture buffer --- current_image_poc_lsb = -1; // any invalid number } decoder_context::~decoder_context() { while (!image_units.empty()) { delete image_units.back(); image_units.pop_back(); } } void decoder_context::set_image_allocation_functions(de265_image_allocation* allocfunc, void* userdata) { if (allocfunc) { param_image_allocation_functions = *allocfunc; param_image_allocation_userdata = userdata; } else { assert(false); // actually, it makes no sense to reset the allocation functions param_image_allocation_functions = de265_image::default_image_allocation; param_image_allocation_userdata = NULL; } } de265_error decoder_context::start_thread_pool(int nThreads) { ::start_thread_pool(&thread_pool_, nThreads); num_worker_threads = nThreads; return DE265_OK; } void decoder_context::stop_thread_pool() { if (get_num_worker_threads()>0) { //flush_thread_pool(&ctx->thread_pool); ::stop_thread_pool(&thread_pool_); } } void decoder_context::reset() { if (num_worker_threads>0) { //flush_thread_pool(&ctx->thread_pool); ::stop_thread_pool(&thread_pool_); } // -------------------------------------------------- #if 0 ctx->end_of_stream = false; ctx->pending_input_NAL = NULL; ctx->current_vps = NULL; ctx->current_sps = NULL; ctx->current_pps = NULL; ctx->num_worker_threads = 0; ctx->current_image_poc_lsb = 0; ctx->first_decoded_picture = 0; ctx->NoRaslOutputFlag = 0; ctx->HandleCraAsBlaFlag = 0; ctx->FirstAfterEndOfSequenceNAL = 0; ctx->PicOrderCntMsb = 0; ctx->prevPicOrderCntLsb = 0; ctx->prevPicOrderCntMsb = 0; ctx->NumPocStCurrBefore=0; ctx->NumPocStCurrAfter=0; ctx->NumPocStFoll=0; ctx->NumPocLtCurr=0; ctx->NumPocLtFoll=0; ctx->nal_unit_type=0; ctx->IdrPicFlag=0; ctx->RapPicFlag=0; #endif img = NULL; // TODO: remove all pending image_units // --- decoded picture buffer --- current_image_poc_lsb = -1; // any invalid number first_decoded_picture = true; // --- remove all pictures from output queue --- // there was a bug the peek_next_image did not return NULL on empty output queues. // This was (indirectly) fixed by recreating the DPB buffer, but it should actually // be sufficient to clear it like this. // The error showed while scrubbing the ToS video in VLC. dpb.clear(); nal_parser.remove_pending_input_data(); while (!image_units.empty()) { delete image_units.back(); image_units.pop_back(); } // --- start threads again --- if (num_worker_threads>0) { // TODO: need error checking start_thread_pool(num_worker_threads); } } void base_context::set_acceleration_functions(enum de265_acceleration l) { // fill scalar functions first (so that function table is completely filled) init_acceleration_functions_fallback(&acceleration); // override functions with optimized variants #ifdef HAVE_SSE4_1 if (l>=de265_acceleration_SSE) { init_acceleration_functions_sse(&acceleration); } #endif #ifdef HAVE_ARM if (l>=de265_acceleration_ARM) { init_acceleration_functions_arm(&acceleration); } #endif } void decoder_context::init_thread_context(thread_context* tctx) { // zero scrap memory for coefficient blocks memset(tctx->_coeffBuf, 0, sizeof(tctx->_coeffBuf)); // TODO: check if we can safely remove this tctx->currentQG_x = -1; tctx->currentQG_y = -1; // --- find QPY that was active at the end of the previous slice --- // find the previous CTB in TS order const pic_parameter_set& pps = tctx->img->get_pps(); const seq_parameter_set& sps = tctx->img->get_sps(); if (tctx->shdr->slice_segment_address > 0) { int prevCtb = pps.CtbAddrTStoRS[ pps.CtbAddrRStoTS[tctx->shdr->slice_segment_address] -1 ]; int ctbX = prevCtb % sps.PicWidthInCtbsY; int ctbY = prevCtb / sps.PicWidthInCtbsY; // take the pixel at the bottom right corner (but consider that the image size might be smaller) int x = ((ctbX+1) << sps.Log2CtbSizeY)-1; int y = ((ctbY+1) << sps.Log2CtbSizeY)-1; x = std::min(x,sps.pic_width_in_luma_samples-1); y = std::min(y,sps.pic_height_in_luma_samples-1); //printf("READ QPY: %d %d -> %d (should %d)\n",x,y,imgunit->img->get_QPY(x,y), tc.currentQPY); //if (tctx->shdr->dependent_slice_segment_flag) { // TODO: do we need this condition ? tctx->currentQPY = tctx->img->get_QPY(x,y); //} } } void decoder_context::add_task_decode_CTB_row(thread_context* tctx, bool firstSliceSubstream, int ctbRow) { thread_task_ctb_row* task = new thread_task_ctb_row; task->firstSliceSubstream = firstSliceSubstream; task->tctx = tctx; task->debug_startCtbRow = ctbRow; tctx->task = task; add_task(&thread_pool_, task); tctx->imgunit->tasks.push_back(task); } void decoder_context::add_task_decode_slice_segment(thread_context* tctx, bool firstSliceSubstream, int ctbx,int ctby) { thread_task_slice_segment* task = new thread_task_slice_segment; task->firstSliceSubstream = firstSliceSubstream; task->tctx = tctx; task->debug_startCtbX = ctbx; task->debug_startCtbY = ctby; tctx->task = task; add_task(&thread_pool_, task); tctx->imgunit->tasks.push_back(task); } de265_error decoder_context::read_vps_NAL(bitreader& reader) { logdebug(LogHeaders,"---> read VPS\n"); std::shared_ptr new_vps = std::make_shared(); de265_error err = new_vps->read(this,&reader); if (err != DE265_OK) { return err; } if (param_vps_headers_fd>=0) { new_vps->dump(param_vps_headers_fd); } vps[ new_vps->video_parameter_set_id ] = new_vps; return DE265_OK; } de265_error decoder_context::read_sps_NAL(bitreader& reader) { logdebug(LogHeaders,"----> read SPS\n"); std::shared_ptr new_sps = std::make_shared(); de265_error err; if ((err=new_sps->read(this, &reader)) != DE265_OK) { return err; } if (param_sps_headers_fd>=0) { new_sps->dump(param_sps_headers_fd); } sps[ new_sps->seq_parameter_set_id ] = new_sps; return DE265_OK; } de265_error decoder_context::read_pps_NAL(bitreader& reader) { logdebug(LogHeaders,"----> read PPS\n"); std::shared_ptr new_pps = std::make_shared(); bool success = new_pps->read(&reader,this); if (param_pps_headers_fd>=0) { new_pps->dump(param_pps_headers_fd); } if (success) { pps[ (int)new_pps->pic_parameter_set_id ] = new_pps; } return success ? DE265_OK : DE265_WARNING_PPS_HEADER_INVALID; } de265_error decoder_context::read_sei_NAL(bitreader& reader, bool suffix) { logdebug(LogHeaders,"----> read SEI\n"); sei_message sei; //push_current_picture_to_output_queue(); de265_error err = DE265_OK; if ((err=read_sei(&reader,&sei, suffix, current_sps.get())) == DE265_OK) { dump_sei(&sei, current_sps.get()); if (image_units.empty()==false && suffix) { image_units.back()->suffix_SEIs.push_back(sei); } } else { add_warning(err, false); } return err; } de265_error decoder_context::read_eos_NAL(bitreader& reader) { FirstAfterEndOfSequenceNAL = true; return DE265_OK; } de265_error decoder_context::read_slice_NAL(bitreader& reader, NAL_unit* nal, nal_header& nal_hdr) { logdebug(LogHeaders,"---> read slice segment header\n"); // --- read slice header --- slice_segment_header* shdr = new slice_segment_header; bool continueDecoding; de265_error err = shdr->read(&reader,this, &continueDecoding); if (!continueDecoding) { if (img) { img->integrity = INTEGRITY_NOT_DECODED; } nal_parser.free_NAL_unit(nal); delete shdr; return err; } if (param_slice_headers_fd>=0) { shdr->dump_slice_segment_header(this, param_slice_headers_fd); } if (process_slice_segment_header(shdr, &err, nal->pts, &nal_hdr, nal->user_data) == false) { if (img!=NULL) img->integrity = INTEGRITY_NOT_DECODED; nal_parser.free_NAL_unit(nal); delete shdr; return err; } this->img->add_slice_segment_header(shdr); skip_bits(&reader,1); // TODO: why? prepare_for_CABAC(&reader); // modify entry_point_offsets int headerLength = reader.data - nal->data(); for (int i=0;inum_entry_point_offsets;i++) { shdr->entry_point_offset[i] -= nal->num_skipped_bytes_before(shdr->entry_point_offset[i], headerLength); } // --- start a new image if this is the first slice --- if (shdr->first_slice_segment_in_pic_flag) { image_unit* imgunit = new image_unit; imgunit->img = this->img; image_units.push_back(imgunit); } // --- add slice to current picture --- if ( ! image_units.empty() ) { slice_unit* sliceunit = new slice_unit(this); sliceunit->nal = nal; sliceunit->shdr = shdr; sliceunit->reader = reader; sliceunit->flush_reorder_buffer = flush_reorder_buffer_at_this_frame; image_units.back()->slice_units.push_back(sliceunit); } bool did_work; err = decode_some(&did_work); return DE265_OK; } template void pop_front(std::vector& vec) { for (int i=1;islice_units.empty() ) { image_unit* imgunit = image_units[0]; slice_unit* sliceunit = imgunit->get_next_unprocessed_slice_segment(); if (sliceunit != NULL) { //pop_front(imgunit->slice_units); if (sliceunit->flush_reorder_buffer) { dpb.flush_reorder_buffer(); } *did_work = true; //err = decode_slice_unit_sequential(imgunit, sliceunit); err = decode_slice_unit_parallel(imgunit, sliceunit); if (err) { return err; } //delete sliceunit; } } // if we decoded all slices of the current image and there will not // be added any more slices to the image, output the image if ( ( image_units.size()>=2 && image_units[0]->all_slice_segments_processed()) || ( image_units.size()>=1 && image_units[0]->all_slice_segments_processed() && nal_parser.number_of_NAL_units_pending()==0 && (nal_parser.is_end_of_stream() || nal_parser.is_end_of_frame()) )) { image_unit* imgunit = image_units[0]; *did_work=true; // mark all CTBs as decoded even if they are not, because faulty input // streams could miss part of the picture // TODO: this will not work when slice decoding is parallel to post-filtering, // so we will have to replace this with keeping track of which CTB should have // been decoded (but aren't because of the input stream being faulty) imgunit->img->mark_all_CTB_progress(CTB_PROGRESS_PREFILTER); // run post-processing filters (deblocking & SAO) if (img->decctx->num_worker_threads) run_postprocessing_filters_parallel(imgunit); else run_postprocessing_filters_sequential(imgunit->img); // process suffix SEIs for (int i=0;isuffix_SEIs.size();i++) { const sei_message& sei = imgunit->suffix_SEIs[i]; err = process_sei(&sei, imgunit->img); if (err != DE265_OK) break; } push_picture_to_output_queue(imgunit); // remove just decoded image unit from queue delete imgunit; pop_front(image_units); } return err; } de265_error decoder_context::decode_slice_unit_sequential(image_unit* imgunit, slice_unit* sliceunit) { de265_error err = DE265_OK; /* printf("decode slice POC=%d addr=%d, img=%p\n", sliceunit->shdr->slice_pic_order_cnt_lsb, sliceunit->shdr->slice_segment_address, imgunit->img); */ remove_images_from_dpb(sliceunit->shdr->RemoveReferencesList); if (sliceunit->shdr->slice_segment_address >= imgunit->img->get_pps().CtbAddrRStoTS.size()) { return DE265_ERROR_CTB_OUTSIDE_IMAGE_AREA; } struct thread_context tctx; tctx.shdr = sliceunit->shdr; tctx.img = imgunit->img; tctx.decctx = this; tctx.imgunit = imgunit; tctx.sliceunit= sliceunit; tctx.CtbAddrInTS = imgunit->img->get_pps().CtbAddrRStoTS[tctx.shdr->slice_segment_address]; tctx.task = NULL; init_thread_context(&tctx); if (sliceunit->reader.bytes_remaining <= 0) { return DE265_ERROR_PREMATURE_END_OF_SLICE; } init_CABAC_decoder(&tctx.cabac_decoder, sliceunit->reader.data, sliceunit->reader.bytes_remaining); // alloc CABAC-model array if entropy_coding_sync is enabled if (imgunit->img->get_pps().entropy_coding_sync_enabled_flag && sliceunit->shdr->first_slice_segment_in_pic_flag) { imgunit->ctx_models.resize( (img->get_sps().PicHeightInCtbsY-1) ); //* CONTEXT_MODEL_TABLE_LENGTH ); } sliceunit->nThreads=1; err=read_slice_segment_data(&tctx); sliceunit->finished_threads.set_progress(1); return err; } void decoder_context::mark_whole_slice_as_processed(image_unit* imgunit, slice_unit* sliceunit, int progress) { //printf("mark whole slice\n"); // mark all CTBs upto the next slice segment as processed slice_unit* nextSegment = imgunit->get_next_slice_segment(sliceunit); if (nextSegment) { /* printf("mark whole slice between %d and %d\n", sliceunit->shdr->slice_segment_address, nextSegment->shdr->slice_segment_address); */ for (int ctb=sliceunit->shdr->slice_segment_address; ctb < nextSegment->shdr->slice_segment_address; ctb++) { if (ctb >= imgunit->img->number_of_ctbs()) break; imgunit->img->ctb_progress[ctb].set_progress(progress); } } } de265_error decoder_context::decode_slice_unit_parallel(image_unit* imgunit, slice_unit* sliceunit) { de265_error err = DE265_OK; remove_images_from_dpb(sliceunit->shdr->RemoveReferencesList); /* printf("-------- decode --------\n"); printf("IMAGE UNIT %p\n",imgunit); sliceunit->shdr->dump_slice_segment_header(sliceunit->ctx, 1); imgunit->dump_slices(); */ de265_image* img = imgunit->img; const pic_parameter_set& pps = img->get_pps(); sliceunit->state = slice_unit::InProgress; bool use_WPP = (img->decctx->num_worker_threads > 0 && pps.entropy_coding_sync_enabled_flag); bool use_tiles = (img->decctx->num_worker_threads > 0 && pps.tiles_enabled_flag); // TODO: remove this warning later when we do frame-parallel decoding if (img->decctx->num_worker_threads > 0 && pps.entropy_coding_sync_enabled_flag == false && pps.tiles_enabled_flag == false) { img->decctx->add_warning(DE265_WARNING_NO_WPP_CANNOT_USE_MULTITHREADING, true); } // If this is the first slice segment, mark all CTBs before this as processed // (the real first slice segment could be missing). if (imgunit->is_first_slice_segment(sliceunit)) { slice_segment_header* shdr = sliceunit->shdr; int firstCTB = shdr->slice_segment_address; for (int ctb=0;ctbctb_progress[ctb].set_progress(CTB_PROGRESS_PREFILTER); } } // if there is a previous slice that has been completely decoded, // mark all CTBs until the start of this slice as completed //printf("this slice: %p\n",sliceunit); slice_unit* prevSlice = imgunit->get_prev_slice_segment(sliceunit); //if (prevSlice) printf("prev slice state: %d\n",prevSlice->state); if (prevSlice && prevSlice->state == slice_unit::Decoded) { mark_whole_slice_as_processed(imgunit,prevSlice,CTB_PROGRESS_PREFILTER); } // TODO: even though we cannot split this into several tasks, we should run it // as a background thread if (!use_WPP && !use_tiles) { //printf("SEQ\n"); err = decode_slice_unit_sequential(imgunit, sliceunit); sliceunit->state = slice_unit::Decoded; mark_whole_slice_as_processed(imgunit,sliceunit,CTB_PROGRESS_PREFILTER); return err; } if (use_WPP && use_tiles) { // TODO: this is not allowed ... output some warning or error return DE265_WARNING_PPS_HEADER_INVALID; } if (use_WPP) { //printf("WPP\n"); err = decode_slice_unit_WPP(imgunit, sliceunit); sliceunit->state = slice_unit::Decoded; mark_whole_slice_as_processed(imgunit,sliceunit,CTB_PROGRESS_PREFILTER); return err; } else if (use_tiles) { //printf("TILE\n"); err = decode_slice_unit_tiles(imgunit, sliceunit); sliceunit->state = slice_unit::Decoded; mark_whole_slice_as_processed(imgunit,sliceunit,CTB_PROGRESS_PREFILTER); return err; } assert(false); return err; } de265_error decoder_context::decode_slice_unit_WPP(image_unit* imgunit, slice_unit* sliceunit) { de265_error err = DE265_OK; de265_image* img = imgunit->img; slice_segment_header* shdr = sliceunit->shdr; const pic_parameter_set& pps = img->get_pps(); int nRows = shdr->num_entry_point_offsets +1; int ctbsWidth = img->get_sps().PicWidthInCtbsY; assert(img->num_threads_active() == 0); // reserve space to store entropy coding context models for each CTB row if (shdr->first_slice_segment_in_pic_flag) { // reserve space for nRows-1 because we don't need to save the CABAC model in the last CTB row imgunit->ctx_models.resize( (img->get_sps().PicHeightInCtbsY-1) ); //* CONTEXT_MODEL_TABLE_LENGTH ); } sliceunit->allocate_thread_contexts(nRows); // first CTB in this slice int ctbAddrRS = shdr->slice_segment_address; int ctbRow = ctbAddrRS / ctbsWidth; for (int entryPt=0;entryPt0) { ctbRow++; ctbAddrRS = ctbRow * ctbsWidth; } else if (nRows>1 && (ctbAddrRS % ctbsWidth) != 0) { // If slice segment consists of several WPP rows, each of them // has to start at a row. //printf("does not start at start\n"); err = DE265_WARNING_SLICEHEADER_INVALID; break; } // prepare thread context thread_context* tctx = sliceunit->get_thread_context(entryPt); tctx->shdr = shdr; tctx->decctx = img->decctx; tctx->img = img; tctx->imgunit = imgunit; tctx->sliceunit= sliceunit; tctx->CtbAddrInTS = pps.CtbAddrRStoTS[ctbAddrRS]; init_thread_context(tctx); // init CABAC int dataStartIndex; if (entryPt==0) { dataStartIndex=0; } else { dataStartIndex=shdr->entry_point_offset[entryPt-1]; } int dataEnd; if (entryPt==nRows-1) dataEnd = sliceunit->reader.bytes_remaining; else dataEnd = shdr->entry_point_offset[entryPt]; if (dataStartIndex<0 || dataEnd>sliceunit->reader.bytes_remaining || dataEnd <= dataStartIndex) { //printf("WPP premature end\n"); err = DE265_ERROR_PREMATURE_END_OF_SLICE; break; } init_CABAC_decoder(&tctx->cabac_decoder, &sliceunit->reader.data[dataStartIndex], dataEnd-dataStartIndex); // add task //printf("start task for ctb-row: %d\n",ctbRow); img->thread_start(1); sliceunit->nThreads++; add_task_decode_CTB_row(tctx, entryPt==0, ctbRow); } #if 0 for (;;) { printf("q:%d r:%d b:%d f:%d\n", img->nThreadsQueued, img->nThreadsRunning, img->nThreadsBlocked, img->nThreadsFinished); if (img->debug_is_completed()) break; usleep(1000); } #endif img->wait_for_completion(); for (int i=0;itasks.size();i++) delete imgunit->tasks[i]; imgunit->tasks.clear(); return DE265_OK; } de265_error decoder_context::decode_slice_unit_tiles(image_unit* imgunit, slice_unit* sliceunit) { de265_error err = DE265_OK; de265_image* img = imgunit->img; slice_segment_header* shdr = sliceunit->shdr; const pic_parameter_set& pps = img->get_pps(); int nTiles = shdr->num_entry_point_offsets +1; int ctbsWidth = img->get_sps().PicWidthInCtbsY; assert(img->num_threads_active() == 0); sliceunit->allocate_thread_contexts(nTiles); // first CTB in this slice int ctbAddrRS = shdr->slice_segment_address; int tileID = pps.TileIdRS[ctbAddrRS]; for (int entryPt=0;entryPt0) { tileID++; if (tileID >= pps.num_tile_columns * pps.num_tile_rows) { err = DE265_WARNING_SLICEHEADER_INVALID; break; } int ctbX = pps.colBd[tileID % pps.num_tile_columns]; int ctbY = pps.rowBd[tileID / pps.num_tile_columns]; ctbAddrRS = ctbY * ctbsWidth + ctbX; } // set thread context thread_context* tctx = sliceunit->get_thread_context(entryPt); tctx->shdr = shdr; tctx->decctx = img->decctx; tctx->img = img; tctx->imgunit = imgunit; tctx->sliceunit= sliceunit; tctx->CtbAddrInTS = pps.CtbAddrRStoTS[ctbAddrRS]; init_thread_context(tctx); // init CABAC int dataStartIndex; if (entryPt==0) { dataStartIndex=0; } else { dataStartIndex=shdr->entry_point_offset[entryPt-1]; } int dataEnd; if (entryPt==nTiles-1) dataEnd = sliceunit->reader.bytes_remaining; else dataEnd = shdr->entry_point_offset[entryPt]; if (dataStartIndex<0 || dataEnd>sliceunit->reader.bytes_remaining || dataEnd <= dataStartIndex) { err = DE265_ERROR_PREMATURE_END_OF_SLICE; break; } init_CABAC_decoder(&tctx->cabac_decoder, &sliceunit->reader.data[dataStartIndex], dataEnd-dataStartIndex); // add task //printf("add tiles thread\n"); img->thread_start(1); sliceunit->nThreads++; add_task_decode_slice_segment(tctx, entryPt==0, ctbAddrRS % ctbsWidth, ctbAddrRS / ctbsWidth); } img->wait_for_completion(); for (int i=0;itasks.size();i++) delete imgunit->tasks[i]; imgunit->tasks.clear(); return err; } de265_error decoder_context::decode_NAL(NAL_unit* nal) { //return decode_NAL_OLD(nal); decoder_context* ctx = this; de265_error err = DE265_OK; bitreader reader; bitreader_init(&reader, nal->data(), nal->size()); nal_header nal_hdr; nal_hdr.read(&reader); ctx->process_nal_hdr(&nal_hdr); if (nal_hdr.nuh_layer_id > 0) { // Discard all NAL units with nuh_layer_id > 0 // These will have to be handeled by an SHVC decoder. nal_parser.free_NAL_unit(nal); return DE265_OK; } loginfo(LogHighlevel,"NAL: 0x%x 0x%x - unit type:%s temporal id:%d\n", nal->data()[0], nal->data()[1], get_NAL_name(nal_hdr.nal_unit_type), nal_hdr.nuh_temporal_id); /* printf("NAL: 0x%x 0x%x - unit type:%s temporal id:%d\n", nal->data()[0], nal->data()[1], get_NAL_name(nal_hdr.nal_unit_type), nal_hdr.nuh_temporal_id); */ // throw away NALs from higher TIDs than currently selected // TODO: better online switching of HighestTID //printf("hTid: %d\n", current_HighestTid); if (nal_hdr.nuh_temporal_id > current_HighestTid) { nal_parser.free_NAL_unit(nal); return DE265_OK; } if (nal_hdr.nal_unit_type<32) { err = read_slice_NAL(reader, nal, nal_hdr); } else switch (nal_hdr.nal_unit_type) { case NAL_UNIT_VPS_NUT: err = read_vps_NAL(reader); nal_parser.free_NAL_unit(nal); break; case NAL_UNIT_SPS_NUT: err = read_sps_NAL(reader); nal_parser.free_NAL_unit(nal); break; case NAL_UNIT_PPS_NUT: err = read_pps_NAL(reader); nal_parser.free_NAL_unit(nal); break; case NAL_UNIT_PREFIX_SEI_NUT: case NAL_UNIT_SUFFIX_SEI_NUT: err = read_sei_NAL(reader, nal_hdr.nal_unit_type==NAL_UNIT_SUFFIX_SEI_NUT); nal_parser.free_NAL_unit(nal); break; case NAL_UNIT_EOS_NUT: ctx->FirstAfterEndOfSequenceNAL = true; nal_parser.free_NAL_unit(nal); break; default: nal_parser.free_NAL_unit(nal); break; } return err; } de265_error decoder_context::decode(int* more) { decoder_context* ctx = this; // if the stream has ended, and no more NALs are to be decoded, flush all pictures if (ctx->nal_parser.get_NAL_queue_length() == 0 && (ctx->nal_parser.is_end_of_stream() || ctx->nal_parser.is_end_of_frame()) && ctx->image_units.empty()) { // flush all pending pictures into output queue // ctx->push_current_picture_to_output_queue(); // TODO: not with new queue ctx->dpb.flush_reorder_buffer(); if (more) { *more = ctx->dpb.num_pictures_in_output_queue(); } return DE265_OK; } // if NAL-queue is empty, we need more data // -> input stalled if (ctx->nal_parser.is_end_of_stream() == false && ctx->nal_parser.is_end_of_frame() == false && ctx->nal_parser.get_NAL_queue_length() == 0) { if (more) { *more=1; } return DE265_ERROR_WAITING_FOR_INPUT_DATA; } // when there are no free image buffers in the DPB, pause decoding // -> output stalled if (!ctx->dpb.has_free_dpb_picture(false)) { if (more) *more = 1; return DE265_ERROR_IMAGE_BUFFER_FULL; } // decode one NAL from the queue de265_error err = DE265_OK; bool did_work = false; if (ctx->nal_parser.get_NAL_queue_length()) { // number_of_NAL_units_pending()) { NAL_unit* nal = ctx->nal_parser.pop_from_NAL_queue(); assert(nal); err = ctx->decode_NAL(nal); // ctx->nal_parser.free_NAL_unit(nal); TODO: do not free NAL with new loop did_work=true; } else if (ctx->nal_parser.is_end_of_frame() == true && ctx->image_units.empty()) { if (more) { *more=1; } return DE265_ERROR_WAITING_FOR_INPUT_DATA; } else { err = decode_some(&did_work); } if (more) { // decoding error is assumed to be unrecoverable *more = (err==DE265_OK && did_work); } return err; } void decoder_context::process_nal_hdr(nal_header* nal) { nal_unit_type = nal->nal_unit_type; IdrPicFlag = isIdrPic(nal->nal_unit_type); RapPicFlag = isRapPic(nal->nal_unit_type); } /* 8.3.1 */ void decoder_context::process_picture_order_count(slice_segment_header* hdr) { loginfo(LogHeaders,"POC computation. lsb:%d prev.pic.lsb:%d msb:%d\n", hdr->slice_pic_order_cnt_lsb, prevPicOrderCntLsb, PicOrderCntMsb); if (isIRAP(nal_unit_type) && NoRaslOutputFlag) { PicOrderCntMsb=0; // flush all images from reorder buffer flush_reorder_buffer_at_this_frame = true; //ctx->dpb.flush_reorder_buffer(); } else { int MaxPicOrderCntLsb = current_sps->MaxPicOrderCntLsb; if ((hdr->slice_pic_order_cnt_lsb < prevPicOrderCntLsb) && (prevPicOrderCntLsb - hdr->slice_pic_order_cnt_lsb) >= MaxPicOrderCntLsb/2) { PicOrderCntMsb = prevPicOrderCntMsb + MaxPicOrderCntLsb; } else if ((hdr->slice_pic_order_cnt_lsb > prevPicOrderCntLsb) && (hdr->slice_pic_order_cnt_lsb - prevPicOrderCntLsb) > MaxPicOrderCntLsb/2) { PicOrderCntMsb = prevPicOrderCntMsb - MaxPicOrderCntLsb; } else { PicOrderCntMsb = prevPicOrderCntMsb; } } img->PicOrderCntVal = PicOrderCntMsb + hdr->slice_pic_order_cnt_lsb; img->picture_order_cnt_lsb = hdr->slice_pic_order_cnt_lsb; loginfo(LogHeaders,"POC computation. new msb:%d POC=%d\n", PicOrderCntMsb, img->PicOrderCntVal); if (img->nal_hdr.nuh_temporal_id==0 && !isSublayerNonReference(nal_unit_type) && !isRASL(nal_unit_type) && !isRADL(nal_unit_type)) { loginfo(LogHeaders,"set prevPicOrderCntLsb/Msb\n"); prevPicOrderCntLsb = hdr->slice_pic_order_cnt_lsb; prevPicOrderCntMsb = PicOrderCntMsb; } } /* 8.3.3.2 Returns DPB index of the generated picture. */ int decoder_context::generate_unavailable_reference_picture(const seq_parameter_set* sps, int POC, bool longTerm) { assert(dpb.has_free_dpb_picture(true)); std::shared_ptr current_sps = this->sps[ (int)current_pps->seq_parameter_set_id ]; int idx = dpb.new_image(current_sps, this, 0,0, false); assert(idx>=0); //printf("-> fill with unavailable POC %d\n",POC); de265_image* img = dpb.get_image(idx); img->fill_image(1<<(sps->BitDepth_Y-1), 1<<(sps->BitDepth_C-1), 1<<(sps->BitDepth_C-1)); img->fill_pred_mode(MODE_INTRA); img->PicOrderCntVal = POC; img->picture_order_cnt_lsb = POC & (sps->MaxPicOrderCntLsb-1); img->PicOutputFlag = false; img->PicState = (longTerm ? UsedForLongTermReference : UsedForShortTermReference); img->integrity = INTEGRITY_UNAVAILABLE_REFERENCE; return idx; } /* 8.3.2 invoked once per picture This function will mark pictures in the DPB as 'unused' or 'used for long-term reference' */ void decoder_context::process_reference_picture_set(slice_segment_header* hdr) { std::vector removeReferencesList; const int currentID = img->get_ID(); if (isIRAP(nal_unit_type) && NoRaslOutputFlag) { int currentPOC = img->PicOrderCntVal; // reset DPB /* The standard says: "When the current picture is an IRAP picture with NoRaslOutputFlag equal to 1, all reference pictures currently in the DPB (if any) are marked as "unused for reference". This seems to be wrong as it also throws out the first CRA picture in a stream like RAP_A (decoding order: CRA,POC=64, RASL,POC=60). Removing only the pictures with lower POCs seems to be compliant to the reference decoder. */ for (int i=0;iPicState != UnusedForReference && img->PicOrderCntVal < currentPOC && img->removed_at_picture_id > img->get_ID()) { removeReferencesList.push_back(img->get_ID()); img->removed_at_picture_id = img->get_ID(); //printf("will remove ID %d (a)\n",img->get_ID()); } } } if (isIDR(nal_unit_type)) { // clear all reference pictures NumPocStCurrBefore = 0; NumPocStCurrAfter = 0; NumPocStFoll = 0; NumPocLtCurr = 0; NumPocLtFoll = 0; } else { const ref_pic_set* rps = &hdr->CurrRps; // (8-98) int i,j,k; // scan ref-pic-set for smaller POCs and fill into PocStCurrBefore / PocStFoll for (i=0, j=0, k=0; iNumNegativePics; i++) { if (rps->UsedByCurrPicS0[i]) { PocStCurrBefore[j++] = img->PicOrderCntVal + rps->DeltaPocS0[i]; //printf("PocStCurrBefore = %d\n",PocStCurrBefore[j-1]); } else { PocStFoll[k++] = img->PicOrderCntVal + rps->DeltaPocS0[i]; } } NumPocStCurrBefore = j; // scan ref-pic-set for larger POCs and fill into PocStCurrAfter / PocStFoll for (i=0, j=0; iNumPositivePics; i++) { if (rps->UsedByCurrPicS1[i]) { PocStCurrAfter[j++] = img->PicOrderCntVal + rps->DeltaPocS1[i]; //printf("PocStCurrAfter = %d\n",PocStCurrAfter[j-1]); } else { PocStFoll[k++] = img->PicOrderCntVal + rps->DeltaPocS1[i]; } } NumPocStCurrAfter = j; NumPocStFoll = k; // find used / future long-term references for (i=0, j=0, k=0; //inum_long_term_ref_pics_sps + hdr->num_long_term_pics; inum_long_term_sps + hdr->num_long_term_pics; i++) { int pocLt = PocLsbLt[i]; if (hdr->delta_poc_msb_present_flag[i]) { int currentPictureMSB = img->PicOrderCntVal - hdr->slice_pic_order_cnt_lsb; pocLt += currentPictureMSB - DeltaPocMsbCycleLt[i] * current_sps->MaxPicOrderCntLsb; } if (UsedByCurrPicLt[i]) { PocLtCurr[j] = pocLt; CurrDeltaPocMsbPresentFlag[j] = hdr->delta_poc_msb_present_flag[i]; j++; } else { PocLtFoll[k] = pocLt; FollDeltaPocMsbPresentFlag[k] = hdr->delta_poc_msb_present_flag[i]; k++; } } NumPocLtCurr = j; NumPocLtFoll = k; } // (old 8-99) / (new 8-106) // 1. std::vector picInAnyList(dpb.size(), false); dpb.log_dpb_content(); for (int i=0;i=0) picInAnyList[k]=true; else { // TODO, CHECK: is it ok that we generate a picture with POC = LSB (PocLtCurr) // We do not know the correct MSB int concealedPicture = generate_unavailable_reference_picture(current_sps.get(), PocLtCurr[i], true); picInAnyList.resize(dpb.size(), false); // adjust size of array to hold new picture RefPicSetLtCurr[i] = k = concealedPicture; picInAnyList[concealedPicture]=true; } if (dpb.get_image(k)->integrity != INTEGRITY_CORRECT) { img->integrity = INTEGRITY_DERIVED_FROM_FAULTY_REFERENCE; } } for (int i=0;i=0) picInAnyList[k]=true; else { int concealedPicture = k = generate_unavailable_reference_picture(current_sps.get(), PocLtFoll[i], true); picInAnyList.resize(dpb.size(), false); // adjust size of array to hold new picture RefPicSetLtFoll[i] = concealedPicture; picInAnyList[concealedPicture]=true; } } // 2. Mark all pictures in RefPicSetLtCurr / RefPicSetLtFoll as UsedForLongTermReference for (int i=0;iPicState = UsedForLongTermReference; } for (int i=0;iPicState = UsedForLongTermReference; } // 3. for (int i=0;i idx=%d\n",PocStCurrBefore[i], k); RefPicSetStCurrBefore[i] = k; // -1 == "no reference picture" if (k>=0) picInAnyList[k]=true; else { int concealedPicture = generate_unavailable_reference_picture(current_sps.get(), PocStCurrBefore[i], false); RefPicSetStCurrBefore[i] = k = concealedPicture; picInAnyList.resize(dpb.size(), false); // adjust size of array to hold new picture picInAnyList[concealedPicture] = true; //printf(" concealed: %d\n", concealedPicture); } if (dpb.get_image(k)->integrity != INTEGRITY_CORRECT) { img->integrity = INTEGRITY_DERIVED_FROM_FAULTY_REFERENCE; } } for (int i=0;i idx=%d\n",PocStCurrAfter[i], k); RefPicSetStCurrAfter[i] = k; // -1 == "no reference picture" if (k>=0) picInAnyList[k]=true; else { int concealedPicture = generate_unavailable_reference_picture(current_sps.get(), PocStCurrAfter[i], false); RefPicSetStCurrAfter[i] = k = concealedPicture; picInAnyList.resize(dpb.size(), false); // adjust size of array to hold new picture picInAnyList[concealedPicture]=true; //printf(" concealed: %d\n", concealedPicture); } if (dpb.get_image(k)->integrity != INTEGRITY_CORRECT) { img->integrity = INTEGRITY_DERIVED_FROM_FAULTY_REFERENCE; } } for (int i=0;i=0) picInAnyList[k]=true; } // 4. any picture that is not marked for reference is put into the "UnusedForReference" state for (int i=0;i=picInAnyList.size() || !picInAnyList[i]) // no reference { de265_image* dpbimg = dpb.get_image(i); if (dpbimg != img && // not the current picture dpbimg->removed_at_picture_id > img->get_ID()) // has not been removed before { if (dpbimg->PicState != UnusedForReference) { removeReferencesList.push_back(dpbimg->get_ID()); //printf("will remove ID %d (b)\n",dpbimg->get_ID()); dpbimg->removed_at_picture_id = img->get_ID(); } } } hdr->RemoveReferencesList = removeReferencesList; //remove_images_from_dpb(hdr->RemoveReferencesList); } // 8.3.4 // Returns whether we can continue decoding (or whether there is a severe error). /* Called at beginning of each slice. Constructs - the RefPicList[2][], containing indices into the DPB, and - the RefPicList_POC[2][], containing POCs. - LongTermRefPic[2][] is also set to true if it is a long-term reference */ bool decoder_context::construct_reference_picture_lists(slice_segment_header* hdr) { int NumPocTotalCurr = hdr->NumPocTotalCurr; int NumRpsCurrTempList0 = libde265_max(hdr->num_ref_idx_l0_active, NumPocTotalCurr); // TODO: fold code for both lists together int RefPicListTemp0[3*MAX_NUM_REF_PICS]; // TODO: what would be the correct maximum ? int RefPicListTemp1[3*MAX_NUM_REF_PICS]; // TODO: what would be the correct maximum ? char isLongTerm[2][3*MAX_NUM_REF_PICS]; memset(isLongTerm,0,2*3*MAX_NUM_REF_PICS); /* --- Fill RefPicListTmp0 with reference pictures in this order: 1) short term, past POC 2) short term, future POC 3) long term */ int rIdx=0; while (rIdx < NumRpsCurrTempList0) { for (int i=0;inum_ref_idx_l0_active > 16) { add_warning(DE265_WARNING_NONEXISTING_REFERENCE_PICTURE_ACCESSED, false); return false; } */ assert(hdr->num_ref_idx_l0_active <= 16); for (rIdx=0; rIdxnum_ref_idx_l0_active; rIdx++) { int idx = hdr->ref_pic_list_modification_flag_l0 ? hdr->list_entry_l0[rIdx] : rIdx; hdr->RefPicList[0][rIdx] = RefPicListTemp0[idx]; hdr->LongTermRefPic[0][rIdx] = isLongTerm[0][idx]; // remember POC of referenced image (needed in motion.c, derive_collocated_motion_vector) de265_image* img_0_rIdx = dpb.get_image(hdr->RefPicList[0][rIdx]); if (img_0_rIdx==NULL) { return false; } hdr->RefPicList_POC[0][rIdx] = img_0_rIdx->PicOrderCntVal; hdr->RefPicList_PicState[0][rIdx] = img_0_rIdx->PicState; } /* --- Fill RefPicListTmp1 with reference pictures in this order: 1) short term, future POC 2) short term, past POC 3) long term */ if (hdr->slice_type == SLICE_TYPE_B) { int NumRpsCurrTempList1 = libde265_max(hdr->num_ref_idx_l1_active, NumPocTotalCurr); int rIdx=0; while (rIdx < NumRpsCurrTempList1) { for (int i=0;inum_ref_idx_l0_active > 16) { add_warning(DE265_WARNING_NONEXISTING_REFERENCE_PICTURE_ACCESSED, false); return false; } assert(hdr->num_ref_idx_l1_active <= 16); for (rIdx=0; rIdxnum_ref_idx_l1_active; rIdx++) { int idx = hdr->ref_pic_list_modification_flag_l1 ? hdr->list_entry_l1[rIdx] : rIdx; hdr->RefPicList[1][rIdx] = RefPicListTemp1[idx]; hdr->LongTermRefPic[1][rIdx] = isLongTerm[1][idx]; // remember POC of referenced imaged (needed in motion.c, derive_collocated_motion_vector) de265_image* img_1_rIdx = dpb.get_image(hdr->RefPicList[1][rIdx]); if (img_1_rIdx == NULL) { return false; } hdr->RefPicList_POC[1][rIdx] = img_1_rIdx->PicOrderCntVal; hdr->RefPicList_PicState[1][rIdx] = img_1_rIdx->PicState; } } // show reference picture lists loginfo(LogHeaders,"RefPicList[0] ="); for (rIdx=0; rIdxnum_ref_idx_l0_active; rIdx++) { loginfo(LogHeaders,"* [%d]=%d (LT=%d)", hdr->RefPicList[0][rIdx], hdr->RefPicList_POC[0][rIdx], hdr->LongTermRefPic[0][rIdx] ); } loginfo(LogHeaders,"*\n"); if (hdr->slice_type == SLICE_TYPE_B) { loginfo(LogHeaders,"RefPicList[1] ="); for (rIdx=0; rIdxnum_ref_idx_l1_active; rIdx++) { loginfo(LogHeaders,"* [%d]=%d (LT=%d)", hdr->RefPicList[1][rIdx], hdr->RefPicList_POC[1][rIdx], hdr->LongTermRefPic[1][rIdx] ); } loginfo(LogHeaders,"*\n"); } return true; } void decoder_context::run_postprocessing_filters_sequential(de265_image* img) { #if SAVE_INTERMEDIATE_IMAGES char buf[1000]; sprintf(buf,"pre-lf-%05d.yuv", img->PicOrderCntVal); write_picture_to_file(img, buf); #endif if (!img->decctx->param_disable_deblocking) { apply_deblocking_filter(img); } #if SAVE_INTERMEDIATE_IMAGES sprintf(buf,"pre-sao-%05d.yuv", img->PicOrderCntVal); write_picture_to_file(img, buf); #endif if (!img->decctx->param_disable_sao) { apply_sample_adaptive_offset_sequential(img); } #if SAVE_INTERMEDIATE_IMAGES sprintf(buf,"sao-%05d.yuv", img->PicOrderCntVal); write_picture_to_file(img, buf); #endif } void decoder_context::run_postprocessing_filters_parallel(image_unit* imgunit) { de265_image* img = imgunit->img; int saoWaitsForProgress = CTB_PROGRESS_PREFILTER; bool waitForCompletion = false; if (!img->decctx->param_disable_deblocking) { add_deblocking_tasks(imgunit); saoWaitsForProgress = CTB_PROGRESS_DEBLK_H; } if (!img->decctx->param_disable_sao) { waitForCompletion |= add_sao_tasks(imgunit, saoWaitsForProgress); //apply_sample_adaptive_offset(img); } img->wait_for_completion(); } /* void decoder_context::push_current_picture_to_output_queue() { push_picture_to_output_queue(img); } */ de265_error decoder_context::push_picture_to_output_queue(image_unit* imgunit) { de265_image* outimg = imgunit->img; if (outimg==NULL) { return DE265_OK; } // push image into output queue if (outimg->PicOutputFlag) { loginfo(LogDPB,"new picture has output-flag=true\n"); if (outimg->integrity != INTEGRITY_CORRECT && param_suppress_faulty_pictures) { } else { dpb.insert_image_into_reorder_buffer(outimg); } loginfo(LogDPB,"push image %d into reordering queue\n", outimg->PicOrderCntVal); } // check for full reorder buffers int maxNumPicsInReorderBuffer = 0; // TODO: I'd like to have the has_vps() check somewhere else (not decode the picture at all) if (outimg->has_vps()) { int sublayer = outimg->get_vps().vps_max_sub_layers -1; maxNumPicsInReorderBuffer = outimg->get_vps().layer[sublayer].vps_max_num_reorder_pics; } if (dpb.num_pictures_in_reorder_buffer() > maxNumPicsInReorderBuffer) { dpb.output_next_picture_in_reorder_buffer(); } dpb.log_dpb_queues(); return DE265_OK; } // returns whether we can continue decoding the stream or whether we should give up bool decoder_context::process_slice_segment_header(slice_segment_header* hdr, de265_error* err, de265_PTS pts, nal_header* nal_hdr, void* user_data) { *err = DE265_OK; flush_reorder_buffer_at_this_frame = false; // get PPS and SPS for this slice int pps_id = hdr->slice_pic_parameter_set_id; if (pps[pps_id]->pps_read==false) { logerror(LogHeaders, "PPS %d has not been read\n", pps_id); assert(false); // TODO } current_pps = pps[pps_id]; current_sps = sps[ (int)current_pps->seq_parameter_set_id ]; current_vps = vps[ (int)current_sps->video_parameter_set_id ]; calc_tid_and_framerate_ratio(); // --- prepare decoding of new picture --- if (hdr->first_slice_segment_in_pic_flag) { // previous picture has been completely decoded //ctx->push_current_picture_to_output_queue(); current_image_poc_lsb = hdr->slice_pic_order_cnt_lsb; seq_parameter_set* sps = current_sps.get(); // --- find and allocate image buffer for decoding --- int image_buffer_idx; bool isOutputImage = (!sps->sample_adaptive_offset_enabled_flag || param_disable_sao); image_buffer_idx = dpb.new_image(current_sps, this, pts, user_data, isOutputImage); if (image_buffer_idx == -1) { *err = DE265_ERROR_IMAGE_BUFFER_FULL; return false; } /*de265_image* */ img = dpb.get_image(image_buffer_idx); img->nal_hdr = *nal_hdr; // Note: sps is already set in new_image() -> ??? still the case with shared_ptr ? img->set_headers(current_vps, current_sps, current_pps); img->decctx = this; img->clear_metadata(); if (isIRAP(nal_unit_type)) { if (isIDR(nal_unit_type) || isBLA(nal_unit_type) || first_decoded_picture || FirstAfterEndOfSequenceNAL) { NoRaslOutputFlag = true; FirstAfterEndOfSequenceNAL = false; } else if (0) // TODO: set HandleCraAsBlaFlag by external means { } else { NoRaslOutputFlag = false; HandleCraAsBlaFlag = false; } } if (isRASL(nal_unit_type) && NoRaslOutputFlag) { img->PicOutputFlag = false; } else { img->PicOutputFlag = !!hdr->pic_output_flag; } process_picture_order_count(hdr); if (hdr->first_slice_segment_in_pic_flag) { // mark picture so that it is not overwritten by unavailable reference frames img->PicState = UsedForShortTermReference; process_reference_picture_set(hdr); } img->PicState = UsedForShortTermReference; log_set_current_POC(img->PicOrderCntVal); // next image is not the first anymore first_decoded_picture = false; } else { // claims to be not the first slice, but there is no active image available if (img == NULL) { return false; } } if (hdr->slice_type == SLICE_TYPE_B || hdr->slice_type == SLICE_TYPE_P) { bool success = construct_reference_picture_lists(hdr); if (!success) { return false; } } //printf("process slice segment header\n"); loginfo(LogHeaders,"end of process-slice-header\n"); dpb.log_dpb_content(); if (hdr->dependent_slice_segment_flag==0) { hdr->SliceAddrRS = hdr->slice_segment_address; } else { hdr->SliceAddrRS = previous_slice_header->SliceAddrRS; } previous_slice_header = hdr; loginfo(LogHeaders,"SliceAddrRS = %d\n",hdr->SliceAddrRS); return true; } void decoder_context::remove_images_from_dpb(const std::vector& removeImageList) { for (int i=0;i=0) { //printf("remove ID %d\n", removeImageList[i]); de265_image* dpbimg = dpb.get_image( idx ); dpbimg->PicState = UnusedForReference; } } } /* . 0 1 2 <- goal_HighestTid +-----+-----+-----+ | -0->| -1->| -2->| +-----+-----+-----+ 0 33 66 100 <- framerate_ratio */ int decoder_context::get_highest_TID() const { if (current_sps) { return current_sps->sps_max_sub_layers-1; } if (current_vps) { return current_vps->vps_max_sub_layers-1; } return 6; } void decoder_context::set_limit_TID(int max_tid) { limit_HighestTid = max_tid; calc_tid_and_framerate_ratio(); } int decoder_context::change_framerate(int more) { if (current_sps == NULL) { return framerate_ratio; } int highestTid = get_highest_TID(); assert(more>=-1 && more<=1); goal_HighestTid += more; goal_HighestTid = std::max(goal_HighestTid, 0); goal_HighestTid = std::min(goal_HighestTid, highestTid); framerate_ratio = framedrop_tid_index[goal_HighestTid]; calc_tid_and_framerate_ratio(); return framerate_ratio; } void decoder_context::set_framerate_ratio(int percent) { framerate_ratio = percent; calc_tid_and_framerate_ratio(); } void decoder_context::compute_framedrop_table() { int highestTID = get_highest_TID(); for (int tid=highestTID ; tid>=0 ; tid--) { int lower = 100 * tid /(highestTID+1); int higher = 100 * (tid+1)/(highestTID+1); for (int l=lower; l<=higher; l++) { int ratio = 100 * (l-lower) / (higher-lower); // if we would exceed our TID limit, decode the highest TID at full frame-rate if (tid > limit_HighestTid) { tid = limit_HighestTid; ratio = 100; } framedrop_tab[l].tid = tid; framedrop_tab[l].ratio = ratio; } framedrop_tid_index[tid] = higher; } #if 0 for (int i=0;i<=100;i++) { printf("%d%%: %d/%d",i, framedrop_tab[i].tid, framedrop_tab[i].ratio); for (int k=0;k<=highestTID;k++) { if (framedrop_tid_index[k] == i) printf(" ** TID=%d **",k); } printf("\n"); } #endif } void decoder_context::calc_tid_and_framerate_ratio() { int highestTID = get_highest_TID(); // if number of temporal layers changed, we have to recompute the framedrop table if (framedrop_tab[100].tid != highestTID) { compute_framedrop_table(); } goal_HighestTid = framedrop_tab[framerate_ratio].tid; layer_framerate_ratio = framedrop_tab[framerate_ratio].ratio; // TODO: for now, we switch immediately current_HighestTid = goal_HighestTid; } void error_queue::add_warning(de265_error warning, bool once) { // check if warning was already shown bool add=true; if (once) { for (int i=0;i