// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include <algorithm>
#include <CoreVideo/CoreVideo.h>
#include <OpenGL/CGLIOSurface.h>
#include <OpenGL/gl.h>
#include "base/bind.h"
#include "base/command_line.h"
#include "base/logging.h"
#include "base/mac/mac_logging.h"
#include "base/sys_byteorder.h"
#include "base/thread_task_runner_handle.h"
#include "content/common/gpu/media/vt_video_decode_accelerator.h"
#include "content/public/common/content_switches.h"
#include "media/base/limits.h"
#include "ui/gl/scoped_binders.h"
using content_common_gpu_media::kModuleVt;
using content_common_gpu_media::InitializeStubs;
using content_common_gpu_media::IsVtInitialized;
using content_common_gpu_media::StubPathMap;
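// Log |status| for |name| (debug builds only) and signal PLATFORM_FAILURE via
// NotifyError(). Defined as a macro so that it expands inside
// VTVideoDecodeAccelerator methods.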
#define NOTIFY_STATUS(name, status) \
do { \
OSSTATUS_DLOG(ERROR, status) << name; \
NotifyError(PLATFORM_FAILURE); \
} while (0)
namespace content {
// Size to use for NALU length headers in AVC format (can be 1, 2, or 4).
static const int kNALUHeaderLength = 4;
// We request 5 picture buffers from the client, each of which has a texture ID
// that we can bind decoded frames to. We need enough to satisfy preroll, and
// enough to avoid unnecessary stalling, but no more than that. The resource
// requirements are low, as we don't need the textures to be backed by storage.
static const int kNumPictureBuffers = media::limits::kMaxVideoFrames + 1;
// Maximum number of frames to queue for reordering before we stop asking for
// more. (NotifyEndOfBitstreamBuffer() is called when frames are moved into the
// reorder queue.)
static const int kMaxReorderQueueSize = 16;
// Build an |image_config| dictionary for VideoToolbox initialization.
static base::ScopedCFTypeRef<CFMutableDictionaryRef>
BuildImageConfig(CMVideoDimensions coded_dimensions) {
// TODO(sandersd): RGBA option for 4:4:4 video.
int32_t pixel_format = kCVPixelFormatType_422YpCbCr8;
#define CFINT(i) CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &i)
base::ScopedCFTypeRef<CFNumberRef> cf_pixel_format(CFINT(pixel_format));
base::ScopedCFTypeRef<CFNumberRef> cf_width(CFINT(coded_dimensions.width));
base::ScopedCFTypeRef<CFNumberRef> cf_height(CFINT(coded_dimensions.height));
#undef CFINT
base::ScopedCFTypeRef<CFMutableDictionaryRef> image_config(
CFDictionaryCreateMutable(
kCFAllocatorDefault,
4, // capacity
&kCFTypeDictionaryKeyCallBacks,
&kCFTypeDictionaryValueCallBacks));
CFDictionarySetValue(image_config, kCVPixelBufferPixelFormatTypeKey,
cf_pixel_format);
CFDictionarySetValue(image_config, kCVPixelBufferWidthKey, cf_width);
CFDictionarySetValue(image_config, kCVPixelBufferHeightKey, cf_height);
CFDictionarySetValue(image_config, kCVPixelBufferOpenGLCompatibilityKey,
kCFBooleanTrue);
return image_config;
}
// The purpose of this function is to preload the generic and hardware-specific
// libraries required by VideoToolbox before the GPU sandbox is enabled.
// VideoToolbox normally loads the hardware-specific libraries lazily, so we
// must actually create a decompression session.
//
// If creating a decompression session fails, hardware decoding will be disabled
// (Initialize() will always return false). If it succeeds but a required
// library is not loaded yet (I have not experienced this, but the details are
// not documented), then VideoToolbox will fall back on software decoding
// internally. If that happens, the likely solution is to expand the scope of
// this initialization.
void InitializeVideoToolbox() {
if (base::CommandLine::ForCurrentProcess()->HasSwitch(
switches::kDisableAcceleratedVideoDecode)) {
return;
}
if (!IsVtInitialized()) {
// CoreVideo is also required, but the loader stops after the first path is
// loaded. Instead we rely on the transitive dependency from VideoToolbox to
// CoreVideo.
    // TODO(sandersd): Fall back to PrivateFrameworks to support OS X < 10.8.
StubPathMap paths;
paths[kModuleVt].push_back(FILE_PATH_LITERAL(
"/System/Library/Frameworks/VideoToolbox.framework/VideoToolbox"));
if (!InitializeStubs(paths))
return;
}
// Create a decoding session.
// SPS and PPS data were taken from the 480p encoding of Big Buck Bunny.
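  // (These bytes decode as nal_unit_type 7, profile_idc 100, level_idc 30;
  // that is, an SPS for High profile, Level 3.0.)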
const uint8_t sps[] = {0x67, 0x64, 0x00, 0x1e, 0xac, 0xd9, 0x80, 0xd4, 0x3d,
0xa1, 0x00, 0x00, 0x03, 0x00, 0x01, 0x00, 0x00, 0x03,
0x00, 0x30, 0x8f, 0x16, 0x2d, 0x9a};
const uint8_t pps[] = {0x68, 0xe9, 0x7b, 0xcb};
const uint8_t* data_ptrs[] = {sps, pps};
const size_t data_sizes[] = {arraysize(sps), arraysize(pps)};
base::ScopedCFTypeRef<CMFormatDescriptionRef> format;
OSStatus status = CMVideoFormatDescriptionCreateFromH264ParameterSets(
kCFAllocatorDefault,
2, // parameter_set_count
data_ptrs, // &parameter_set_pointers
data_sizes, // &parameter_set_sizes
kNALUHeaderLength, // nal_unit_header_length
format.InitializeInto());
if (status) {
OSSTATUS_LOG(ERROR, status) << "Failed to create CMVideoFormatDescription "
<< "while initializing VideoToolbox";
content_common_gpu_media::UninitializeVt();
return;
}
base::ScopedCFTypeRef<CFMutableDictionaryRef> decoder_config(
CFDictionaryCreateMutable(
kCFAllocatorDefault,
1, // capacity
&kCFTypeDictionaryKeyCallBacks,
&kCFTypeDictionaryValueCallBacks));
CFDictionarySetValue(
decoder_config,
// kVTVideoDecoderSpecification_RequireHardwareAcceleratedVideoDecoder
CFSTR("RequireHardwareAcceleratedVideoDecoder"),
kCFBooleanTrue);
base::ScopedCFTypeRef<CFMutableDictionaryRef> image_config(
BuildImageConfig(CMVideoFormatDescriptionGetDimensions(format)));
VTDecompressionOutputCallbackRecord callback = {0};
base::ScopedCFTypeRef<VTDecompressionSessionRef> session;
status = VTDecompressionSessionCreate(
kCFAllocatorDefault,
format, // video_format_description
decoder_config, // video_decoder_specification
image_config, // destination_image_buffer_attributes
&callback, // output_callback
session.InitializeInto());
if (status) {
OSSTATUS_LOG(ERROR, status) << "Failed to create VTDecompressionSession "
<< "while initializing VideoToolbox";
content_common_gpu_media::UninitializeVt();
return;
}
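  // |session| and |format| are released as they go out of scope; they are
  // created only for the side effect of loading the decoder libraries.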
}
// Route decoded frame callbacks back into the VTVideoDecodeAccelerator.
static void OutputThunk(
void* decompression_output_refcon,
void* source_frame_refcon,
OSStatus status,
VTDecodeInfoFlags info_flags,
CVImageBufferRef image_buffer,
CMTime presentation_time_stamp,
CMTime presentation_duration) {
VTVideoDecodeAccelerator* vda =
reinterpret_cast<VTVideoDecodeAccelerator*>(decompression_output_refcon);
vda->Output(source_frame_refcon, status, image_buffer);
}
VTVideoDecodeAccelerator::Task::Task(TaskType type) : type(type) {
}
VTVideoDecodeAccelerator::Task::~Task() {
}
VTVideoDecodeAccelerator::Frame::Frame(int32_t bitstream_id)
: bitstream_id(bitstream_id), pic_order_cnt(0), reorder_window(0) {
}
VTVideoDecodeAccelerator::Frame::~Frame() {
}
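// Comparator for the frame reorder queue. Returning true when |lhs| should be
// output after |rhs| makes a std::priority_queue using this comparator a
// min-heap, so the frame with the lowest |pic_order_cnt| sorts to the top.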
bool VTVideoDecodeAccelerator::FrameOrder::operator()(
const linked_ptr<Frame>& lhs,
const linked_ptr<Frame>& rhs) const {
if (lhs->pic_order_cnt != rhs->pic_order_cnt)
return lhs->pic_order_cnt > rhs->pic_order_cnt;
// If |pic_order_cnt| is the same, fall back on using the bitstream order.
// TODO(sandersd): Assign a sequence number in Decode() and use that instead.
// TODO(sandersd): Using the sequence number, ensure that frames older than
// |kMaxReorderQueueSize| are ordered first, regardless of |pic_order_cnt|.
return lhs->bitstream_id > rhs->bitstream_id;
}
VTVideoDecodeAccelerator::VTVideoDecodeAccelerator(
CGLContextObj cgl_context,
const base::Callback<bool(void)>& make_context_current)
: cgl_context_(cgl_context),
make_context_current_(make_context_current),
client_(NULL),
state_(STATE_DECODING),
format_(NULL),
session_(NULL),
last_sps_id_(-1),
last_pps_id_(-1),
gpu_task_runner_(base::ThreadTaskRunnerHandle::Get()),
decoder_thread_("VTDecoderThread"),
weak_this_factory_(this) {
DCHECK(!make_context_current_.is_null());
callback_.decompressionOutputCallback = OutputThunk;
callback_.decompressionOutputRefCon = this;
weak_this_ = weak_this_factory_.GetWeakPtr();
}
VTVideoDecodeAccelerator::~VTVideoDecodeAccelerator() {
}
bool VTVideoDecodeAccelerator::Initialize(
media::VideoCodecProfile profile,
Client* client) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
client_ = client;
if (!IsVtInitialized())
return false;
// Only H.264 is supported.
if (profile < media::H264PROFILE_MIN || profile > media::H264PROFILE_MAX)
return false;
// Spawn a thread to handle parsing and calling VideoToolbox.
if (!decoder_thread_.Start())
return false;
return true;
}
bool VTVideoDecodeAccelerator::FinishDelayedFrames() {
DCHECK(decoder_thread_.message_loop_proxy()->BelongsToCurrentThread());
if (session_) {
OSStatus status = VTDecompressionSessionFinishDelayedFrames(session_);
if (status) {
NOTIFY_STATUS("VTDecompressionSessionFinishDelayedFrames()", status);
return false;
}
}
return true;
}
bool VTVideoDecodeAccelerator::ConfigureDecoder() {
DCHECK(decoder_thread_.message_loop_proxy()->BelongsToCurrentThread());
DCHECK(!last_sps_.empty());
DCHECK(!last_pps_.empty());
// Build the configuration records.
std::vector<const uint8_t*> nalu_data_ptrs;
std::vector<size_t> nalu_data_sizes;
nalu_data_ptrs.reserve(3);
nalu_data_sizes.reserve(3);
nalu_data_ptrs.push_back(&last_sps_.front());
nalu_data_sizes.push_back(last_sps_.size());
if (!last_spsext_.empty()) {
nalu_data_ptrs.push_back(&last_spsext_.front());
nalu_data_sizes.push_back(last_spsext_.size());
}
nalu_data_ptrs.push_back(&last_pps_.front());
nalu_data_sizes.push_back(last_pps_.size());
// Construct a new format description from the parameter sets.
// TODO(sandersd): Replace this with custom code to support OS X < 10.9.
format_.reset();
OSStatus status = CMVideoFormatDescriptionCreateFromH264ParameterSets(
kCFAllocatorDefault,
nalu_data_ptrs.size(), // parameter_set_count
&nalu_data_ptrs.front(), // &parameter_set_pointers
&nalu_data_sizes.front(), // &parameter_set_sizes
kNALUHeaderLength, // nal_unit_header_length
format_.InitializeInto());
if (status) {
NOTIFY_STATUS("CMVideoFormatDescriptionCreateFromH264ParameterSets()",
status);
return false;
}
// Store the new configuration data.
CMVideoDimensions coded_dimensions =
CMVideoFormatDescriptionGetDimensions(format_);
coded_size_.SetSize(coded_dimensions.width, coded_dimensions.height);
// If the session is compatible, there's nothing else to do.
if (session_ &&
VTDecompressionSessionCanAcceptFormatDescription(session_, format_)) {
return true;
}
// Prepare VideoToolbox configuration dictionaries.
base::ScopedCFTypeRef<CFMutableDictionaryRef> decoder_config(
CFDictionaryCreateMutable(
kCFAllocatorDefault,
1, // capacity
&kCFTypeDictionaryKeyCallBacks,
&kCFTypeDictionaryValueCallBacks));
CFDictionarySetValue(
decoder_config,
// kVTVideoDecoderSpecification_EnableHardwareAcceleratedVideoDecoder
CFSTR("EnableHardwareAcceleratedVideoDecoder"),
kCFBooleanTrue);
base::ScopedCFTypeRef<CFMutableDictionaryRef> image_config(
BuildImageConfig(coded_dimensions));
// TODO(sandersd): Does the old session need to be flushed first?
session_.reset();
status = VTDecompressionSessionCreate(
kCFAllocatorDefault,
format_, // video_format_description
decoder_config, // video_decoder_specification
image_config, // destination_image_buffer_attributes
&callback_, // output_callback
session_.InitializeInto());
if (status) {
NOTIFY_STATUS("VTDecompressionSessionCreate()", status);
return false;
}
return true;
}
void VTVideoDecodeAccelerator::DecodeTask(
const media::BitstreamBuffer& bitstream,
Frame* frame) {
DCHECK(decoder_thread_.message_loop_proxy()->BelongsToCurrentThread());
// Map the bitstream buffer.
base::SharedMemory memory(bitstream.handle(), true);
size_t size = bitstream.size();
if (!memory.Map(size)) {
DLOG(ERROR) << "Failed to map bitstream buffer";
NotifyError(PLATFORM_FAILURE);
return;
}
const uint8_t* buf = static_cast<uint8_t*>(memory.memory());
  // NALUs are stored in Annex B format in the bitstream buffer (start codes),
// but VideoToolbox expects AVC format (length headers), so we must rewrite
// the data.
//
// Locate relevant NALUs and compute the size of the rewritten data. Also
// record any parameter sets for VideoToolbox initialization.
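  //
  // For example, with the 4-byte length headers used here (kNALUHeaderLength),
  // a 10-byte NALU is rewritten from
  //   Annex B: 00 00 00 01 <10 payload bytes>
  // to
  //   AVC:     00 00 00 0a <10 payload bytes>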
bool config_changed = false;
size_t data_size = 0;
std::vector<media::H264NALU> nalus;
parser_.SetStream(buf, size);
media::H264NALU nalu;
while (true) {
media::H264Parser::Result result = parser_.AdvanceToNextNALU(&nalu);
if (result == media::H264Parser::kEOStream)
break;
if (result != media::H264Parser::kOk) {
DLOG(ERROR) << "Failed to find H.264 NALU";
NotifyError(UNREADABLE_INPUT);
return;
}
switch (nalu.nal_unit_type) {
case media::H264NALU::kSPS:
last_sps_.assign(nalu.data, nalu.data + nalu.size);
last_spsext_.clear();
config_changed = true;
if (parser_.ParseSPS(&last_sps_id_) != media::H264Parser::kOk) {
DLOG(ERROR) << "Could not parse SPS";
NotifyError(UNREADABLE_INPUT);
return;
}
break;
case media::H264NALU::kSPSExt:
// TODO(sandersd): Check that the previous NALU was an SPS.
last_spsext_.assign(nalu.data, nalu.data + nalu.size);
config_changed = true;
break;
case media::H264NALU::kPPS:
last_pps_.assign(nalu.data, nalu.data + nalu.size);
config_changed = true;
if (parser_.ParsePPS(&last_pps_id_) != media::H264Parser::kOk) {
DLOG(ERROR) << "Could not parse PPS";
NotifyError(UNREADABLE_INPUT);
return;
}
break;
case media::H264NALU::kSliceDataA:
case media::H264NALU::kSliceDataB:
case media::H264NALU::kSliceDataC:
DLOG(ERROR) << "Coded slide data partitions not implemented.";
NotifyError(PLATFORM_FAILURE);
return;
case media::H264NALU::kNonIDRSlice:
// TODO(sandersd): Check that there has been an IDR slice since the
// last reset.
case media::H264NALU::kIDRSlice:
{
// TODO(sandersd): Make sure this only happens once per frame.
DCHECK_EQ(frame->pic_order_cnt, 0);
media::H264SliceHeader slice_hdr;
result = parser_.ParseSliceHeader(nalu, &slice_hdr);
if (result != media::H264Parser::kOk) {
DLOG(ERROR) << "Could not parse slice header";
NotifyError(UNREADABLE_INPUT);
return;
}
// TODO(sandersd): Maintain a cache of configurations and reconfigure
// only when a slice references a new config.
DCHECK_EQ(slice_hdr.pic_parameter_set_id, last_pps_id_);
const media::H264PPS* pps =
parser_.GetPPS(slice_hdr.pic_parameter_set_id);
if (!pps) {
DLOG(ERROR) << "Mising PPS referenced by slice";
NotifyError(UNREADABLE_INPUT);
return;
}
DCHECK_EQ(pps->seq_parameter_set_id, last_sps_id_);
const media::H264SPS* sps = parser_.GetSPS(pps->seq_parameter_set_id);
if (!sps) {
DLOG(ERROR) << "Mising SPS referenced by PPS";
NotifyError(UNREADABLE_INPUT);
return;
}
if (!poc_.ComputePicOrderCnt(sps, slice_hdr, &frame->pic_order_cnt)) {
NotifyError(UNREADABLE_INPUT);
return;
}
if (sps->vui_parameters_present_flag &&
sps->bitstream_restriction_flag) {
frame->reorder_window = std::min(sps->max_num_reorder_frames,
kMaxReorderQueueSize - 1);
}
}
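      // Intentional fall-through: slice NALUs are also counted and copied into
      // the rewritten buffer below.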
default:
nalus.push_back(nalu);
data_size += kNALUHeaderLength + nalu.size;
break;
}
}
// Initialize VideoToolbox.
// TODO(sandersd): Instead of assuming that the last SPS and PPS units are
// always the correct ones, maintain a cache of recent SPS and PPS units and
// select from them using the slice header.
if (config_changed) {
if (last_sps_.size() == 0 || last_pps_.size() == 0) {
DLOG(ERROR) << "Invalid configuration data";
NotifyError(INVALID_ARGUMENT);
return;
}
if (!ConfigureDecoder())
return;
}
// If there are no non-configuration units, drop the bitstream buffer by
// returning an empty frame.
if (!data_size) {
if (!FinishDelayedFrames())
return;
gpu_task_runner_->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::DecodeDone, weak_this_, frame));
return;
}
// If the session is not configured by this point, fail.
if (!session_) {
DLOG(ERROR) << "Image slice without configuration";
NotifyError(INVALID_ARGUMENT);
return;
}
// Update the frame metadata with configuration data.
frame->coded_size = coded_size_;
// Create a memory-backed CMBlockBuffer for the translated data.
// TODO(sandersd): Pool of memory blocks.
base::ScopedCFTypeRef<CMBlockBufferRef> data;
OSStatus status = CMBlockBufferCreateWithMemoryBlock(
kCFAllocatorDefault,
NULL, // &memory_block
data_size, // block_length
kCFAllocatorDefault, // block_allocator
NULL, // &custom_block_source
0, // offset_to_data
data_size, // data_length
0, // flags
data.InitializeInto());
if (status) {
NOTIFY_STATUS("CMBlockBufferCreateWithMemoryBlock()", status);
return;
}
// Copy NALU data into the CMBlockBuffer, inserting length headers.
size_t offset = 0;
for (size_t i = 0; i < nalus.size(); i++) {
media::H264NALU& nalu = nalus[i];
uint32_t header = base::HostToNet32(static_cast<uint32_t>(nalu.size));
status = CMBlockBufferReplaceDataBytes(
&header, data, offset, kNALUHeaderLength);
if (status) {
NOTIFY_STATUS("CMBlockBufferReplaceDataBytes()", status);
return;
}
offset += kNALUHeaderLength;
status = CMBlockBufferReplaceDataBytes(nalu.data, data, offset, nalu.size);
if (status) {
NOTIFY_STATUS("CMBlockBufferReplaceDataBytes()", status);
return;
}
offset += nalu.size;
}
// Package the data in a CMSampleBuffer.
base::ScopedCFTypeRef<CMSampleBufferRef> sample;
status = CMSampleBufferCreate(
kCFAllocatorDefault,
data, // data_buffer
true, // data_ready
NULL, // make_data_ready_callback
NULL, // make_data_ready_refcon
format_, // format_description
1, // num_samples
0, // num_sample_timing_entries
NULL, // &sample_timing_array
0, // num_sample_size_entries
NULL, // &sample_size_array
sample.InitializeInto());
if (status) {
NOTIFY_STATUS("CMSampleBufferCreate()", status);
return;
}
// Send the frame for decoding.
// Asynchronous Decompression allows for parallel submission of frames
// (without it, DecodeFrame() does not return until the frame has been
// decoded). We don't enable Temporal Processing so that frames are always
// returned in decode order; this makes it easier to avoid deadlock.
VTDecodeFrameFlags decode_flags =
kVTDecodeFrame_EnableAsynchronousDecompression;
status = VTDecompressionSessionDecodeFrame(
session_,
sample, // sample_buffer
decode_flags, // decode_flags
reinterpret_cast<void*>(frame), // source_frame_refcon
NULL); // &info_flags_out
if (status) {
NOTIFY_STATUS("VTDecompressionSessionDecodeFrame()", status);
return;
}
}
// This method may be called on any VideoToolbox thread.
void VTVideoDecodeAccelerator::Output(
void* source_frame_refcon,
OSStatus status,
CVImageBufferRef image_buffer) {
if (status) {
NOTIFY_STATUS("Decoding", status);
} else if (CFGetTypeID(image_buffer) != CVPixelBufferGetTypeID()) {
DLOG(ERROR) << "Decoded frame is not a CVPixelBuffer";
NotifyError(PLATFORM_FAILURE);
} else {
Frame* frame = reinterpret_cast<Frame*>(source_frame_refcon);
frame->image.reset(image_buffer, base::scoped_policy::RETAIN);
gpu_task_runner_->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::DecodeDone, weak_this_, frame));
}
}
void VTVideoDecodeAccelerator::DecodeDone(Frame* frame) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(1u, pending_frames_.count(frame->bitstream_id));
Task task(TASK_FRAME);
task.frame = pending_frames_[frame->bitstream_id];
pending_frames_.erase(frame->bitstream_id);
task_queue_.push(task);
ProcessWorkQueues();
}
void VTVideoDecodeAccelerator::FlushTask(TaskType type) {
DCHECK(decoder_thread_.message_loop_proxy()->BelongsToCurrentThread());
FinishDelayedFrames();
// Always queue a task, even if FinishDelayedFrames() fails, so that
// destruction always completes.
gpu_task_runner_->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::FlushDone, weak_this_, type));
}
void VTVideoDecodeAccelerator::FlushDone(TaskType type) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
task_queue_.push(Task(type));
ProcessWorkQueues();
}
void VTVideoDecodeAccelerator::Decode(const media::BitstreamBuffer& bitstream) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(0u, assigned_bitstream_ids_.count(bitstream.id()));
assigned_bitstream_ids_.insert(bitstream.id());
Frame* frame = new Frame(bitstream.id());
pending_frames_[frame->bitstream_id] = make_linked_ptr(frame);
decoder_thread_.message_loop_proxy()->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::DecodeTask, base::Unretained(this),
bitstream, frame));
}
void VTVideoDecodeAccelerator::AssignPictureBuffers(
const std::vector<media::PictureBuffer>& pictures) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
for (const media::PictureBuffer& picture : pictures) {
DCHECK(!texture_ids_.count(picture.id()));
assigned_picture_ids_.insert(picture.id());
available_picture_ids_.push_back(picture.id());
texture_ids_[picture.id()] = picture.texture_id();
}
  // Pictures are not marked as uncleared until after this method returns, and
  // they will be broken if they are used before that happens. So, schedule any
  // further work to run after that point.
gpu_task_runner_->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::ProcessWorkQueues, weak_this_));
}
void VTVideoDecodeAccelerator::ReusePictureBuffer(int32_t picture_id) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
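  // The client is done with the picture, so the binding should hold the only
  // remaining reference to the image buffer.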
DCHECK_EQ(CFGetRetainCount(picture_bindings_[picture_id]), 1);
picture_bindings_.erase(picture_id);
if (assigned_picture_ids_.count(picture_id) != 0) {
available_picture_ids_.push_back(picture_id);
ProcessWorkQueues();
} else {
client_->DismissPictureBuffer(picture_id);
}
}
void VTVideoDecodeAccelerator::ProcessWorkQueues() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
switch (state_) {
case STATE_DECODING:
// TODO(sandersd): Batch where possible.
while (ProcessReorderQueue() || ProcessTaskQueue());
return;
case STATE_ERROR:
// Do nothing until Destroy() is called.
return;
case STATE_DESTROYING:
// Drop tasks until we are ready to destruct.
while (!task_queue_.empty()) {
if (task_queue_.front().type == TASK_DESTROY) {
delete this;
return;
}
task_queue_.pop();
}
return;
}
}
bool VTVideoDecodeAccelerator::ProcessTaskQueue() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(state_, STATE_DECODING);
if (task_queue_.empty())
return false;
const Task& task = task_queue_.front();
switch (task.type) {
case TASK_FRAME:
// TODO(sandersd): Signal IDR explicitly (not using pic_order_cnt == 0).
if (reorder_queue_.size() < kMaxReorderQueueSize &&
(task.frame->pic_order_cnt != 0 || reorder_queue_.empty())) {
assigned_bitstream_ids_.erase(task.frame->bitstream_id);
client_->NotifyEndOfBitstreamBuffer(task.frame->bitstream_id);
reorder_queue_.push(task.frame);
task_queue_.pop();
return true;
}
return false;
case TASK_FLUSH:
DCHECK_EQ(task.type, pending_flush_tasks_.front());
if (reorder_queue_.size() == 0) {
pending_flush_tasks_.pop();
client_->NotifyFlushDone();
task_queue_.pop();
return true;
}
return false;
case TASK_RESET:
DCHECK_EQ(task.type, pending_flush_tasks_.front());
if (reorder_queue_.size() == 0) {
last_sps_id_ = -1;
last_pps_id_ = -1;
last_sps_.clear();
last_spsext_.clear();
last_pps_.clear();
poc_.Reset();
pending_flush_tasks_.pop();
client_->NotifyResetDone();
task_queue_.pop();
return true;
}
return false;
case TASK_DESTROY:
NOTREACHED() << "Can't destroy while in STATE_DECODING.";
NotifyError(ILLEGAL_STATE);
return false;
}
}
bool VTVideoDecodeAccelerator::ProcessReorderQueue() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(state_, STATE_DECODING);
if (reorder_queue_.empty())
return false;
  // If the next task is a flush (because there is a pending flush or because
// the next frame is an IDR), then we don't need a full reorder buffer to send
// the next frame.
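  // For example, with |reorder_window| == 2, frames are held until three are
  // queued, and only then is the earliest one sent.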
bool flushing = !task_queue_.empty() &&
(task_queue_.front().type != TASK_FRAME ||
task_queue_.front().frame->pic_order_cnt == 0);
size_t reorder_window = std::max(0, reorder_queue_.top()->reorder_window);
if (flushing || reorder_queue_.size() > reorder_window) {
if (ProcessFrame(*reorder_queue_.top())) {
reorder_queue_.pop();
return true;
}
}
return false;
}
bool VTVideoDecodeAccelerator::ProcessFrame(const Frame& frame) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(state_, STATE_DECODING);
// If the next pending flush is for a reset, then the frame will be dropped.
bool resetting = !pending_flush_tasks_.empty() &&
pending_flush_tasks_.front() == TASK_RESET;
if (!resetting && frame.image.get()) {
// If the |coded_size| has changed, request new picture buffers and then
// wait for them.
// TODO(sandersd): If GpuVideoDecoder didn't specifically check the size of
// textures, this would be unnecessary, as the size is actually a property
// of the texture binding, not the texture. We rebind every frame, so the
// size passed to ProvidePictureBuffers() is meaningless.
if (picture_size_ != frame.coded_size) {
// Dismiss current pictures.
for (int32_t picture_id : assigned_picture_ids_)
client_->DismissPictureBuffer(picture_id);
assigned_picture_ids_.clear();
available_picture_ids_.clear();
// Request new pictures.
picture_size_ = frame.coded_size;
      client_->ProvidePictureBuffers(
          kNumPictureBuffers, frame.coded_size, GL_TEXTURE_RECTANGLE_ARB);
return false;
}
if (!SendFrame(frame))
return false;
}
return true;
}
bool VTVideoDecodeAccelerator::SendFrame(const Frame& frame) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
DCHECK_EQ(state_, STATE_DECODING);
if (available_picture_ids_.empty())
return false;
int32_t picture_id = available_picture_ids_.back();
IOSurfaceRef surface = CVPixelBufferGetIOSurface(frame.image.get());
if (!make_context_current_.Run()) {
DLOG(ERROR) << "Failed to make GL context current";
NotifyError(PLATFORM_FAILURE);
return false;
}
glEnable(GL_TEXTURE_RECTANGLE_ARB);
gfx::ScopedTextureBinder
texture_binder(GL_TEXTURE_RECTANGLE_ARB, texture_ids_[picture_id]);
CGLError status = CGLTexImageIOSurface2D(
cgl_context_, // ctx
GL_TEXTURE_RECTANGLE_ARB, // target
GL_RGB, // internal_format
frame.coded_size.width(), // width
frame.coded_size.height(), // height
GL_YCBCR_422_APPLE, // format
GL_UNSIGNED_SHORT_8_8_APPLE, // type
surface, // io_surface
0); // plane
if (status != kCGLNoError) {
NOTIFY_STATUS("CGLTexImageIOSurface2D()", status);
return false;
}
glDisable(GL_TEXTURE_RECTANGLE_ARB);
available_picture_ids_.pop_back();
picture_bindings_[picture_id] = frame.image;
client_->PictureReady(media::Picture(
picture_id, frame.bitstream_id, gfx::Rect(frame.coded_size)));
return true;
}
void VTVideoDecodeAccelerator::NotifyError(Error error) {
if (!gpu_thread_checker_.CalledOnValidThread()) {
gpu_task_runner_->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::NotifyError, weak_this_, error));
} else if (state_ == STATE_DECODING) {
state_ = STATE_ERROR;
client_->NotifyError(error);
}
}
void VTVideoDecodeAccelerator::QueueFlush(TaskType type) {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
pending_flush_tasks_.push(type);
decoder_thread_.message_loop_proxy()->PostTask(FROM_HERE, base::Bind(
&VTVideoDecodeAccelerator::FlushTask, base::Unretained(this),
type));
// If this is a new flush request, see if we can make progress.
if (pending_flush_tasks_.size() == 1)
ProcessWorkQueues();
}
void VTVideoDecodeAccelerator::Flush() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
QueueFlush(TASK_FLUSH);
}
void VTVideoDecodeAccelerator::Reset() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
QueueFlush(TASK_RESET);
}
void VTVideoDecodeAccelerator::Destroy() {
DCHECK(gpu_thread_checker_.CalledOnValidThread());
// In a forceful shutdown, the decoder thread may be dead already.
if (!decoder_thread_.IsRunning()) {
delete this;
return;
}
// For a graceful shutdown, return assigned buffers and flush before
// destructing |this|.
// TODO(sandersd): Make sure the decoder won't try to read the buffers again
// before discarding them.
for (int32_t bitstream_id : assigned_bitstream_ids_)
client_->NotifyEndOfBitstreamBuffer(bitstream_id);
assigned_bitstream_ids_.clear();
state_ = STATE_DESTROYING;
QueueFlush(TASK_DESTROY);
}
bool VTVideoDecodeAccelerator::CanDecodeOnIOThread() {
return false;
}
} // namespace content