cpp/api/VideoPicture_8cpp_source.html

 /*******************************************************************************

  * Copyright (c) 2024, 2026, Olivier Ayache.  All rights reserved.

  *

  * This file is part of AVPKit.

  *

  * AVPKit is free software: you can redistribute it and/or modify

  * it under the terms of the GNU Lesser General Public License as published by

  * the Free Software Foundation, either version 3 of the License, or

  * (at your option) any later version.

  *

  * AVPKit is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public License

  * along with AVPKit.  If not, see <http://www.gnu.org/licenses/>.

  *******************************************************************************/


 #include <stdexcept>

 // for memset

 #include <cstring>

 #include <com/avpkit/ferry/Logger.h>

 #include <com/avpkit/ferry/RefPointer.h>

 #include <com/avpkit/core/Global.h>

 #include "com/avpkit/core/VideoPicture.h"


 extern "C" {

 #include <libavcodec/mediacodec.h>

 #ifdef __APPLE__

 #include <CoreMedia/CMSampleBuffer.h>

 #endif

 }


 VS_LOG_SETUP(VS_CPP_PACKAGE);


 namespace com { namespace avpkit { namespace core

 {


   // Builds an empty, not-yet-complete picture: allocates the underlying
   // AVFrame, marks its geometry and pixel format as unset, and installs a
   // 1/1000000 time base.
   // Throws std::bad_alloc if the AVFrame cannot be allocated.
   VideoPicture :: VideoPicture()
   {
 #ifdef __APPLE__
     // No sample buffer exists until render() creates one.
     mCMSampleBuffer = NULL;
 #endif
     mIsComplete = false;

     mFrame = av_frame_alloc();
     if (mFrame == 0)
       throw std::bad_alloc();

     // Stash a back-pointer to this wrapper in the frame's opaque slot.
     mFrame->opaque = this;

     // Negative dimensions and the NONE format mean "not configured yet".
     mFrame->format = static_cast<int>(IPixelFormat::NONE);
     mFrame->height = -1;
     mFrame->width = -1;

     mTimeBase = IRational::make(1, 1000000);
   }


   // Releases the AVFrame, drops the references held on the data buffer and
   // time base, and (on Apple platforms) releases any sample buffer created
   // by render().
   VideoPicture :: ~VideoPicture()
   {
     // The frame comes from av_frame_alloc(), so it must be released with
     // av_frame_free(): a plain av_free() only frees the struct and leaks
     // anything the frame references (side data added by setSideData(),
     // buffers attached by av_hwframe_transfer_data(), ...).
     if (mFrame)
       av_frame_free(&mFrame);
     mFrame = 0;
     mBuffer = 0;
     mTimeBase = 0;
 #ifdef __APPLE__
     if (mCMSampleBuffer){
         CFRelease(mCMSampleBuffer);
         mCMSampleBuffer = NULL;
     }
 #endif
   }


   // Factory: creates a picture with the given pixel format and dimensions
   // and flags it as a key frame. No pixel buffer is attached here.
   //
   // Returns the new picture, or 0 if a std::exception other than
   // std::bad_alloc was raised (the error is logged at debug level).
   // std::bad_alloc is propagated to the caller.
   VideoPicture*
   VideoPicture :: make(IPixelFormat::Type format, int width, int height)
   {
     VideoPicture * retval=0;
     try {
       retval = VideoPicture::make();
       // Same guard as the buffer-taking overload: never dereference a
       // null result from the default factory.
       if (!retval)
         throw std::bad_alloc();
       retval->mFrame->format = format;
       retval->mFrame->width = width;
       retval->mFrame->height = height;
       // default new frames to be key frames
       retval->setKeyFrame(true);
     }
     catch (const std::bad_alloc&)
     {
       VS_REF_RELEASE(retval);
       // Bare rethrow keeps the original exception object instead of
       // throwing a (possibly sliced) copy.
       throw;
     }
     catch (const std::exception& e)
     {
       VS_LOG_DEBUG("error: %s", e.what());
       VS_REF_RELEASE(retval);
     }

     return retval;
   }


   // Factory: creates a picture of the given format and dimensions whose
   // pixel data lives in the caller-supplied buffer. The picture takes its
   // own reference on the buffer and points the frame's plane pointers and
   // line sizes into it (alignment 1).
   //
   // Returns 0 when buffer is null, when the buffer is smaller than the
   // picture requires, or when its memory cannot be accessed (these errors
   // are logged at debug level). std::bad_alloc is propagated to the caller.
   VideoPicture*
   VideoPicture :: make(
       com::avpkit::ferry::IBuffer* buffer, IPixelFormat::Type format,
       int width, int height)
   {
     if (!buffer)
       return 0;
     VideoPicture *retval = 0;
     try {
       retval = make(format, width,height);
       if (!retval)
         throw std::bad_alloc();

       // NOTE(review): a non-positive size skips the capacity check below
       // and is passed straight to getBytes() -- confirm that is intended.
       int32_t size = retval->getSize();
       if (size > 0 && size > buffer->getBufferSize())
         throw std::runtime_error("input buffer is not large enough for given picture");

       retval->mBuffer.reset(buffer, true);
       unsigned char* bytes = (unsigned char*)buffer->getBytes(0, size);
       if (!bytes)
         throw std::runtime_error("could not access raw memory in buffer");

       (void) av_image_fill_arrays(retval->mFrame->data,
               retval->mFrame->linesize,
               bytes,
               (AVPixelFormat) format,
               width,
               height,
               1);

     }
     catch (const std::bad_alloc&)
     {
       VS_REF_RELEASE(retval);
       // Bare rethrow keeps the original exception object instead of
       // throwing a (possibly sliced) copy.
       throw;
     }
     catch (const std::exception& e)
     {
       VS_LOG_DEBUG("error: %s", e.what());
       VS_REF_RELEASE(retval);
     }
     return retval;
   }


   // Replaces the buffer backing this picture. A null buffer is ignored;
   // otherwise the picture takes its own reference on the new buffer.
   //
   // When the picture has a valid size and the new buffer can hold it, the
   // frame's plane pointers are re-pointed into the new buffer. Without this
   // they would keep referring to the previous buffer, which may be freed
   // once its reference is dropped here. A buffer that is too small is left
   // for the existing "reallocate if too small" checks to replace.
   void
   VideoPicture :: setData(com::avpkit::ferry::IBuffer* buffer)
   {
     if (!buffer) return;
     mBuffer.reset(buffer, true);

     const int32_t size = getSize();
     if (size <= 0 || buffer->getBufferSize() < size)
       return;

     uint8_t* bytes = (uint8_t*)buffer->getBytes(0, size);
     if (!bytes)
       return;

     (void) av_image_fill_arrays(mFrame->data,
         mFrame->linesize,
         bytes,
         (AVPixelFormat) mFrame->format,
         mFrame->width,
         mFrame->height,
         1);
   }


   // Copies the pixel data of srcFrame into this picture and marks this
   // picture complete with the source's format, dimensions and PTS.
   //
   // The byte count copied is this picture's own size, so this picture must
   // already have valid dimensions and format.
   //
   // Returns true on success; false (after a debug log) when the source is
   // null, incomplete, has no data buffer, is smaller than this picture, or
   // when either raw buffer cannot be accessed.
   bool
   VideoPicture :: copy(IVideoPicture * srcFrame)
   {
     bool result = false;
     try
     {
       if (!srcFrame)
         throw std::runtime_error("empty source frame to copy");

       if (!srcFrame->isComplete())
         throw std::runtime_error("source frame is not complete");

       // NOTE(review): static_cast performs no runtime type check, so this
       // test can never fire for a non-null srcFrame; it is kept only to
       // preserve the original control flow.
       VideoPicture* src = static_cast<VideoPicture*>(srcFrame);
       if (!src)
         throw std::runtime_error("src frame is not of right subtype");

       // A complete source with no buffer would otherwise be dereferenced.
       if (!src->mBuffer)
         throw std::runtime_error("source frame has no data buffer");

       // Make sure we have somewhere to copy into (throws on invalid size).
       allocInternalFrameBuffer();

       const int32_t srcSize = src->getSize();
       const int32_t dstSize = getSize();
       // memcpy below reads dstSize bytes from the source; refuse to read
       // past the end of a smaller source picture.
       if (srcSize < dstSize)
         throw std::runtime_error("source frame is smaller than destination frame");

       // get the raw buffers
       unsigned char* srcBuffer = (unsigned char*)src->mBuffer->getBytes(0, srcSize);
       unsigned char* dstBuffer = (unsigned char*)mBuffer->getBytes(0, dstSize);
       if (!srcBuffer || !dstBuffer)
         throw std::runtime_error("could not get buffer to copy");

       // memcpy on overlapping regions is undefined; a self-copy needs no work.
       if (srcBuffer != dstBuffer)
         memcpy(dstBuffer, srcBuffer, dstSize);

       this->setComplete(true,
           srcFrame->getPixelType(),
           srcFrame->getWidth(),
           srcFrame->getHeight(),
           srcFrame->getPts());
       result = true;
     }
     catch (const std::exception & e)
     {
       VS_LOG_DEBUG("error: %s", e.what());
       result = false;
     }
     return result;
   }


   // Returns the buffer backing this picture, allocating the internal buffer
   // first when none exists or the current one is too small. The pointer
   // comes from RefPointer::get(), which acquires a reference for the caller.
   //
   // Returns 0 when the picture has no valid size, or when a std::exception
   // other than std::bad_alloc was raised (logged at debug level).
   // std::bad_alloc is propagated to the caller.
   com::avpkit::ferry::IBuffer*
   VideoPicture :: getData()
   {
     com::avpkit::ferry::IBuffer *retval = 0;
     try {
       if (getSize() > 0) {
         if (!mBuffer || mBuffer->getBufferSize() < getSize())
         {
           allocInternalFrameBuffer();
         }
         retval = mBuffer.get();
         if (!retval) {
           throw std::bad_alloc();
         }
       }
     } catch (const std::bad_alloc&) {
       VS_REF_RELEASE(retval);
       // Bare rethrow keeps the original exception object instead of
       // throwing a (possibly sliced) copy.
       throw;
     } catch (const std::exception & e)
     {
       VS_LOG_DEBUG("Error: %s", e.what());
       VS_REF_RELEASE(retval);
     }
     return retval;
   }


   void

   VideoPicture::render(bool drop, int64_t timeStamp) {

       if (mFrame && (av_pix_fmt_desc_get((AVPixelFormat) mFrame->format)->flags & AV_PIX_FMT_FLAG_HWACCEL)) {

         #ifdef __ANDROID__

           mediacodec_render_frame(mFrame, timeStamp, drop);

         #elif __APPLE__

           CVImageBufferRef image = (CVImageBufferRef) mFrame->data[3];

           CMVideoFormatDescriptionRef formatDescription;

           if (mCMSampleBuffer){

               CFRelease(mCMSampleBuffer);

           }

           CMTime duration = kCMTimeIndefinite;

           CMTime pts = CMTimeMake(timeStamp , 1000000000);

           const CMSampleTimingInfo timingInfo = {

                         .decodeTimeStamp = kCMTimeInvalid,

                         .duration = duration,

                         .presentationTimeStamp = pts

                     };

           CMVideoFormatDescriptionCreateForImageBuffer(NULL, image, &formatDescription);

           CMSampleBufferCreateReadyWithImageBuffer(NULL, image, formatDescription, &timingInfo, &mCMSampleBuffer);

           return sampleBuffer;

         #endif

       }

   }


   // Exposes the platform-specific handle attached to this picture: the
   // CMSampleBuffer held in mCMSampleBuffer on Apple builds (may be NULL),
   // and always NULL on every other platform.
   void*
   VideoPicture :: getOpaqueData()
   {
 #ifdef __APPLE__
     return mCMSampleBuffer;
 #else
     return NULL;
 #endif
   }


   // Populates a caller-owned AVFrame from this picture: allocates the
   // internal buffer if needed, bit-copies our AVFrame into `frame`, then
   // re-points the copy's plane pointers and line sizes at our pixel buffer
   // and carries over the quality value.
   void
   VideoPicture :: fillAVFrame(AVFrame *frame)
   {
     const bool mustAllocate = !mBuffer || mBuffer->getBufferSize() < getSize();
     if (mustAllocate)
       allocInternalFrameBuffer();

     unsigned char* pixels =
         static_cast<unsigned char*>(mBuffer->getBytes(0, getSize()));

     // Inherently unsafe: this is a raw bit-for-bit copy of the whole struct,
     // so every pointer inside `frame` now aliases the ones in mFrame...
     memcpy(frame, mFrame, sizeof(AVFrame));

     // ...and av_image_fill_arrays() is relied upon to overwrite the plane
     // pointers and line sizes so they refer to our buffer.
     av_image_fill_arrays(frame->data,
         frame->linesize,
         pixels,
         (AVPixelFormat) frame->format,
         frame->width,
         frame->height,
         1);

     frame->quality = getQuality();
   }


   // Copies a decoded AVFrame into this picture.
   //
   // Software pixel formats: this picture is resized to width x height in
   // format `pixel`, the internal buffer is (re)allocated if needed, and the
   // image planes plus the key-frame flag are copied from `frame`.
   // Hardware pixel formats: only width/height are updated; then either the
   // data is transferred with av_hwframe_transfer_data(), or (for MEDIACODEC)
   // the data[3] pointer is shared with `frame`.
   //
   // Nothing is thrown to the caller: every std::exception raised here is
   // logged at debug level and swallowed.
   void
   VideoPicture :: copyAVFrame(AVFrame* frame, IPixelFormat::Type pixel,
       int32_t width, int32_t height)
   {
     try
     {
       // Need to copy the contents of frame->data to our
       // internal buffer.
       VS_ASSERT(frame, "no frame?");
       // Runtime guard as well, in case the assertion above is compiled out.
       if (!frame)
         throw std::runtime_error("no frame to copy");

       // av_pix_fmt_desc_get() returns NULL for formats it does not know;
       // dereferencing that would crash instead of reporting an error.
       const AVPixFmtDescriptor* desc = av_pix_fmt_desc_get((AVPixelFormat) pixel);
       if (!desc)
         throw std::runtime_error("unknown pixel format");

       if (!(desc->flags & AV_PIX_FMT_FLAG_HWACCEL)) {
         VS_ASSERT(frame->data[0], "no data in frame");
         // resize the frame to the AVFrame
         mFrame->width = width;
         mFrame->height = height;
         mFrame->format = (int)pixel;

         int bufSize = getSize();
         if (bufSize <= 0)
           throw std::runtime_error("invalid size for frame");

         if (!mBuffer || mBuffer->getBufferSize() < bufSize)
           // reuse buffers if we can.
           allocInternalFrameBuffer();

         uint8_t* buffer = (uint8_t*)mBuffer->getBytes(0, bufSize);
         if (!buffer)
           throw std::runtime_error("really?  no buffer");

         if (!frame->data[0])
           throw std::runtime_error("no data in frame to copy");

         // Make sure the frame isn't already using our buffer
         if(buffer != frame->data[0])
         {
           // NOTE(review): the destination is sized from pixel/width/height
           // but the copy uses frame->format and frame->width/height;
           // callers are presumably expected to pass matching values.
           av_image_fill_arrays(mFrame->data, mFrame->linesize, buffer,
             (AVPixelFormat) frame->format, width, height, 1);
           av_image_copy(mFrame->data, mFrame->linesize, (const uint8_t **)frame->data,
                 frame->linesize, (AVPixelFormat)frame->format, frame->width, frame->height);
         }
         mFrame->key_frame = frame->key_frame;
       }
       else
       {
         mFrame->width = width;
         mFrame->height = height;
 //      mFrame->format = (int) pixel;
         if (pixel != IPixelFormat::MEDIACODEC)
         {
             //mFrame->hw_frames_ctx = frame->hw_frames_ctx;
           // Surface transfer failures in the log instead of ignoring them.
           if (av_hwframe_transfer_data(mFrame, frame, 0) < 0)
             throw std::runtime_error("could not transfer hardware frame data");
         }
         else
         {
             //av_frame_copy_props(mFrame, frame);
           mFrame->data[3] = frame->data[3];
         }
       }
     }
     catch (const std::exception & e)
     {
       VS_LOG_DEBUG("error: %s", e.what());
     }
   }


   // Hands out the AVFrame this picture manages, first making sure an
   // internal buffer of sufficient size is attached. An existing buffer is
   // kept when it is already big enough. allocInternalFrameBuffer() may
   // throw, e.g. when the picture has no valid size.
   AVFrame*
   VideoPicture :: getAVFrame()
   {
     const bool mustAllocate = !mBuffer || mBuffer->getBufferSize() < getSize();
     if (mustAllocate)
       allocInternalFrameBuffer();
     return mFrame;
   }


   // Looks up the line size recorded for plane `lineNo` of the frame.
   // Returns -1 when no frame is available or lineNo falls outside the
   // frame's linesize array.
   int
   VideoPicture :: getDataLineSize(int lineNo)
   {
     // getAVFrame() runs first, exactly as before: it may allocate the
     // internal buffer (and throw) before any index validation happens.
     if (!getAVFrame())
       return -1;

     if (lineNo < 0)
       return -1;

     if ((unsigned int) lineNo >= (sizeof(mFrame->linesize)/sizeof(mFrame->linesize[0])))
       return -1;

     return mFrame->linesize[lineNo];
   }


   // Reports the frame's key-frame flag; false when there is no frame.
   bool
   VideoPicture :: isKeyFrame()
   {
     if (!mFrame)
       return false;
     return mFrame->key_frame != 0;
   }


   // Stores the key-frame flag on the frame; silently ignored when there is
   // no frame.
   void
   VideoPicture :: setKeyFrame(bool aIsKey)
   {
     if (!mFrame)
       return;
     mFrame->key_frame = aIsKey ? 1 : 0;
   }


   // Reads the presentation time stamp stored on the frame; -1 when there
   // is no frame.
   int64_t
   VideoPicture :: getPts()
   {
     if (!mFrame)
       return -1;
     return mFrame->pts;
   }


   // Writes the presentation time stamp onto the frame; silently ignored
   // when there is no frame.
   void
   VideoPicture :: setPts(int64_t value)
   {
     if (!mFrame)
       return;
     mFrame->pts = value;
   }


   // Reads the quality value stored on the frame; falls back to
   // FF_LAMBDA_MAX when there is no frame.
   int
   VideoPicture :: getQuality()
   {
     if (!mFrame)
       return FF_LAMBDA_MAX;
     return mFrame->quality;
   }


   // Stores a quality value on the frame. Values outside
   // [0, FF_LAMBDA_MAX] are replaced by FF_LAMBDA_MAX. Nothing is stored
   // when there is no frame.
   void
   VideoPicture :: setQuality(int newQuality)
   {
     const bool outOfRange = newQuality < 0 || newQuality > FF_LAMBDA_MAX;
     const int effectiveQuality = outOfRange ? FF_LAMBDA_MAX : newQuality;

     if (!mFrame)
       return;
     mFrame->quality = effectiveQuality;
   }


   // Records whether the picture's data is complete and, when it is, stores
   // the given PTS. The supplied format, width and height are then compared
   // with what the frame already holds; a mismatch (or a missing frame) is
   // only logged at debug level -- the completeness flag and PTS set above
   // are not rolled back.
   //
   // A format of NONE, or a non-positive width/height (on either side),
   // skips the corresponding comparison.
   void
   VideoPicture :: setComplete(
       bool aIsComplete,
       IPixelFormat::Type format,
       int width,
       int height,
       int64_t pts
   )
   {
     try {
       mIsComplete = aIsComplete;
       if (aIsComplete)
         setPts(pts);

       if (!mFrame)
         throw std::runtime_error("no AVFrame allocated");

       const int unsetFormat = (int)IPixelFormat::NONE;
       const bool bothFormatsKnown =
           format != IPixelFormat::NONE && mFrame->format != unsetFormat;
       if (bothFormatsKnown && (int)format != mFrame->format)
         throw std::runtime_error("pixel formats don't match");

       const bool bothWidthsKnown = width > 0 && mFrame->width >0;
       if (bothWidthsKnown && width != mFrame->width)
         throw std::runtime_error("width does not match");

       const bool bothHeightsKnown = height > 0 && mFrame->height > 0;
       if (bothHeightsKnown && height != mFrame->height)
         throw std::runtime_error("height does not match");
     }
     catch (std::exception& e)
     {
       VS_LOG_DEBUG("error: %s", e.what());
     }
   }


   // Computes how many bytes the picture occupies for the frame's current
   // format and dimensions (alignment 1), as reported by
   // av_image_get_buffer_size(). Returns -1 while either dimension is not
   // positive.
   int32_t
   VideoPicture :: getSize()
   {
     if (mFrame->width <= 0 || mFrame->height <= 0)
       return -1;

     return av_image_get_buffer_size(
         (AVPixelFormat)mFrame->format,
         mFrame->width,
         mFrame->height,
         1);
   }


   // Ensures mBuffer can hold the picture and points the frame's plane
   // pointers and line sizes into it.
   //
   // An existing buffer that is already large enough is reused. Otherwise a
   // new buffer is created with 8 extra trailing bytes, which are zeroed.
   //
   // Throws std::runtime_error when the picture has no valid size or the
   // planes cannot be laid out in the buffer, and std::bad_alloc when the
   // buffer cannot be created or its memory cannot be accessed.
   void
   VideoPicture :: allocInternalFrameBuffer()
   {
     int bufSize = getSize();
     if (bufSize <= 0)
       throw std::runtime_error("invalid size for frame");

     // reuse buffers if we can.
     if (!mBuffer || mBuffer->getBufferSize() < bufSize)
     {
       // Now, it turns out some accelerated assembly functions will
       // read at least a word past the end of an image buffer, so
       // we make space for that to happen.
       // I arbitrarily choose the sizeof a long-long (64 bit).

       // note that if the user has passed in their own buffer that is
       // the right 'size' but doesnt have this padding, we let it through anyway.
       int extraBytes=sizeof(int64_t);

       // Make our copy buffer.
       mBuffer = com::avpkit::ferry::IBuffer::make(this, bufSize+extraBytes);
       if (!mBuffer) {
         throw std::bad_alloc();
       }

       // Now, to further work around issues, I added the extra 8-bytes,
       // and now I'm going to zero just those 8-bytes out.  I don't
       // zero-out the whole buffer because I want Valgrind to detect
       // if it's not written to first.  But I know this overrun
       // issue exists in the MMX conversions in SWScale for some libraries,
       // so I'm going to fake it out here.
       {
         unsigned char * buf =
           ((unsigned char*)mBuffer->getBytes(0, bufSize+extraBytes));
         // getBytes() can fail; check before writing through the pointer
         // rather than only after the memset, as the code did previously.
         if (!buf)
           throw std::bad_alloc();

         memset(buf+bufSize, 0, extraBytes);
       }
     }
     uint8_t* buffer = (uint8_t*)mBuffer->getBytes(0, bufSize);
     if (!buffer)
       throw std::bad_alloc();

     int imageSize = av_image_fill_arrays(mFrame->data,
         mFrame->linesize,
         buffer,
         (AVPixelFormat)mFrame->format,
         mFrame->width,
         mFrame->height,
         1);
     // The layout computed by FFmpeg must match the size we allocated for.
     if (imageSize != bufSize)
       throw std::runtime_error("could not fill picture");

 //    mFrame->type = FF_BUFFER_TYPE_USER;
     VS_ASSERT(mFrame->data[0] != 0, "Empty buffer");
   }


   // Reads the frame's picture type, converted to IVideoPicture::PictType;
   // DEFAULT_TYPE when there is no frame.
   IVideoPicture::PictType
   VideoPicture :: getPictureType()
   {
     if (!mFrame)
       return IVideoPicture::DEFAULT_TYPE;
     return (PictType) mFrame->pict_type;
   }


   // Writes the picture type onto the frame, converted to AVPictureType;
   // silently ignored when there is no frame.
   void
   VideoPicture :: setPictureType(IVideoPicture::PictType type)
   {
     if (!mFrame)
       return;
     mFrame->pict_type = (enum AVPictureType) type;
   }


   // Attaches side data of the given type to the frame, sized from
   // buffer->getSize() and filled with the buffer's contents.
   //
   // Does nothing when there is no frame, when buffer is null, or when the
   // buffer reports a negative size. If the side data cannot be allocated,
   // or the buffer's memory cannot be accessed, no bytes are copied.
   void
   VideoPicture::setSideData(IVideoPicture::FrameDataType type, com::avpkit::ferry::IBuffer* buffer) {
       if (!mFrame || !buffer)
         return;

       const int32_t size = buffer->getSize();
       if (size < 0)
         return;

       AVFrameSideData* sideData =
           av_frame_new_side_data(mFrame, (AVFrameSideDataType)type, size);
       if (!sideData || !sideData->data || size == 0)
         return;

       // av_frame_new_side_data() only allocates the payload; the caller's
       // bytes still have to be copied in, which was previously missing.
       const void* bytes = buffer->getBytes(0, size);
       if (bytes)
         memcpy(sideData->data, bytes, size);
   }


 }}}

com::avpkit::core::IPixelFormat::Type
Type
Pixel format.
Definition: IPixelFormat.h:65

com::avpkit::core::IPixelFormat::MEDIACODEC
@ MEDIACODEC
HW decoding through Android MediaCodec
Definition: IPixelFormat.h:288

com::avpkit::core::IRational::make
static IRational * make()
Get a new rational that will be set to 0/0.
Definition: IRational.cpp:79

com::avpkit::core::IVideoPicture
Represents one raw (undecoded) picture in a video stream, plus a timestamp for when to display that v...
Definition: IVideoPicture.h:40

com::avpkit::core::IVideoPicture::getWidth
virtual int getWidth()=0
What is the width of the picture.

com::avpkit::core::IVideoPicture::getHeight
virtual int getHeight()=0
What is the height of the picture.

com::avpkit::core::IVideoPicture::getPixelType
virtual IPixelFormat::Type getPixelType()=0
Returns the pixel format of the picture.

com::avpkit::core::IVideoPicture::isComplete
virtual bool isComplete()=0
Is this picture completely decoded?

com::avpkit::core::IVideoPicture::PictType
PictType
The different types of images that we can set.
Definition: IVideoPicture.h:221

com::avpkit::core::IVideoPicture::FrameDataType
FrameDataType
Definition: IVideoPicture.h:255

com::avpkit::core::IVideoPicture::getPts
virtual int64_t getPts()=0
What is the Presentation Time Stamp (in Microseconds) of this picture.

com::avpkit::core::VideoPicture
Definition: VideoPicture.h:34

com::avpkit::core::VideoPicture::setComplete
virtual void setComplete(bool aIsComplete, IPixelFormat::Type format, int width, int height, int64_t pts)
After modifying the raw data in this buffer, call this function to let the object know it is now comp...
Definition: VideoPicture.cpp:410

com::avpkit::core::VideoPicture::setData
virtual void setData(com::avpkit::ferry::IBuffer *buffer)
Sets the underlying buffer used by this object.
Definition: VideoPicture.cpp:147

com::avpkit::core::VideoPicture::getPts
virtual int64_t getPts()
What is the Presentation Time Stamp (in Microseconds) of this picture.
Definition: VideoPicture.cpp:382

com::avpkit::core::VideoPicture::getSize
virtual int32_t getSize()
Total size in bytes of the decoded picture.
Definition: VideoPicture.cpp:442

com::avpkit::core::VideoPicture::copyAVFrame
void copyAVFrame(AVFrame *frame, IPixelFormat::Type pixel, int32_t width, int32_t height)
Called by the StreamCoder once it's done decoding.
Definition: VideoPicture.cpp:279

com::avpkit::core::VideoPicture::setKeyFrame
virtual void setKeyFrame(bool aIsKey)
Reset if this is a key frame or not.
Definition: VideoPicture.cpp:375

com::avpkit::core::VideoPicture::isKeyFrame
virtual bool isKeyFrame()
Is this a key frame?
Definition: VideoPicture.cpp:369

com::avpkit::core::VideoPicture::setPictureType
virtual void setPictureType(IVideoPicture::PictType type)
Set the picture type.
Definition: VideoPicture.cpp:516

com::avpkit::core::VideoPicture::getData
virtual com::avpkit::ferry::IBuffer * getData()
Get any underlying raw data available for this object.
Definition: VideoPicture.cpp:196

com::avpkit::core::VideoPicture::setPts
virtual void setPts(int64_t)
Set the Presentation Time Stamp (in Microseconds) for this picture.
Definition: VideoPicture.cpp:388

com::avpkit::core::VideoPicture::getPictureType
virtual IVideoPicture::PictType getPictureType()
Get the picture type.
Definition: VideoPicture.cpp:507

com::avpkit::core::VideoPicture::getDataLineSize
virtual int getDataLineSize(int lineNo)
Return the size of each line in the VideoPicture data.
Definition: VideoPicture.cpp:358

com::avpkit::core::VideoPicture::fillAVFrame
void fillAVFrame(AVFrame *frame)
Called by the StreamCoder before it encodes a picture.
Definition: VideoPicture.cpp:257

com::avpkit::core::VideoPicture::copy
virtual bool copy(IVideoPicture *srcFrame)
Copy the contents of the given picture into this picture.
Definition: VideoPicture.cpp:155

com::avpkit::core::VideoPicture::setQuality
virtual void setQuality(int newQuality)
Set the Quality to a new value.
Definition: VideoPicture.cpp:401

com::avpkit::core::VideoPicture::getQuality
virtual int getQuality()
This value is the quality setting this VideoPicture had when it was decoded, or is the value to use w...
Definition: VideoPicture.cpp:395

com::avpkit::core::VideoPicture::make
static VideoPicture * make(IPixelFormat::Type format, int width, int height)
The default factory for a frame.
Definition: VideoPicture.cpp:75

com::avpkit::core::VideoPicture::render
virtual void render(bool drop, int64_t timeStamp)
Render this picture on configured surface.
Definition: VideoPicture.cpp:222

com::avpkit::core::VideoPicture::getAVFrame
VS_API_AVPKIT AVFrame * getAVFrame()
Call to get the raw underlying AVFrame we manage; don't pass this to ffmpeg directly as ffmpeg often ...
Definition: VideoPicture.cpp:347

com::avpkit::ferry::IBuffer
Allows Java code to get data from a native buffers, and optionally modify native memory directly.
Definition: IBuffer.h:54

com::avpkit::ferry::IBuffer::make
static IBuffer * make(RefCounted *requestor, void *bufToWrap, int32_t bufferSize, FreeFunc freeFunc, void *closure)
Allocate a new buffer by wrapping a native buffer.
Definition: IBuffer.cpp:48

com::avpkit::ferry::IBuffer::getBytes
virtual void * getBytes(int32_t offset, int32_t length)=0
Returns up to length bytes, starting at offset in the underlying buffer we're managing.

com::avpkit::ferry::IBuffer::getBufferSize
virtual int32_t getBufferSize()=0
Get the current maximum number of bytes that can be safely placed in this buffer.

com::avpkit::ferry::IBuffer::getSize
virtual int32_t getSize()=0
Returns the size, in units of getType() of this buffer.

com::avpkit::ferry::RefPointer::get
T * get()
Call RefCounted::acquire() on the managed pointer and return it.
Definition: RefPointer.h:206

com::avpkit::ferry::RefPointer::reset
void reset(T *ptr=0, bool acquire=false)
Reset the managed pointer, calling RefCounted::release() on the previously managed pointer first.
Definition: RefPointer.h:237

com
WARNING: Do not use logging in this class, and do not set any static file variables to values other t...
Definition: AudioResampler.cpp:30