// Copyright (c) 2006-2007, Rodrigo Braz Monteiro
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//   * Redistributions of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//   * Redistributions in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//   * Neither the name of the Aegisub Group nor the names of its contributors
//     may be used to endorse or promote products derived from this software
//     without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// -----------------------------------------------------------------------------
//
// AEGISUB
//
// Website: http://aegisub.cellosoft.com
// Contact: mailto:zeratul@cellosoft.com
//


///////////
// Headers
#ifdef WITH_FFMPEG

#ifdef WIN32
#define EMULATE_INTTYPES
#define __STDC_CONSTANT_MACROS 1
// NOTE(review): the target of this #include was missing from the file as
// received; <stdint.h> is assumed because of the two defines above - confirm.
#include <stdint.h>
#endif /* WIN32 */

// NOTE(review): the targets of the next four #includes were missing from the
// file as received. They are reconstructed from what this file uses (_T(),
// wxImage/wxBitmap in the disabled code, standard containers) - confirm
// against version control before merging.
#include <wx/wxprec.h>
#include <wx/image.h>
#include <algorithm>
#include <vector>
#include "video_provider_lavc.h"
#include "mkv_wrap.h"
#include "lavc_file.h"
#include "utils.h"
#include "vfr.h"
#include "ass_file.h"
#include "lavc_keyframes.h"
#include "video_context.h"


///////////////
// Constructor
// Resets every handle this class releases in Close() and then opens the
// given file through LoadVideo(). LoadVideo() cleans up after itself before
// rethrowing, so a failed construction does not leak decoder state.
LAVCVideoProvider::LAVCVideoProvider(Aegisub::String filename,double fps) {
	// Init variables
	codecContext = NULL;
	lavcfile = NULL;
	codec = NULL;
	stream = NULL;
	frame = NULL;
	frameRGB = NULL;
	bufferRGB = NULL;
	sws_context = NULL;
	buffer1 = NULL;
	buffer2 = NULL;
	buffer1Size = 0;
	buffer2Size = 0;
	vidStream = -1;
	validFrame = false;
	framesData.clear();

	// Load
	LoadVideo(filename,fps);
}


//////////////
// Destructor
LAVCVideoProvider::~LAVCVideoProvider() {
	Close();
}


//////////////
// Load video
// Opens the file, selects the first video stream, opens a decoder for it and
// indexes the file for keyframes and per-frame DTS values.
// The fps argument is not used by this function.
// Throws a _T() string on failure; everything opened so far is released via
// Close() before the exception is rethrown.
void LAVCVideoProvider::LoadVideo(Aegisub::String filename, double fps) {
	// Close first
	Close();

	lavcfile = LAVCFile::Create(filename);

	// Load
	try {
		int result = 0;

		// Find video stream
		// codecContext is only assigned once a video stream is actually
		// found, so it never points at a non-video stream.
		vidStream = -1;
		codecContext = NULL;
		for (int i=0; i < (int)lavcfile->fctx->nb_streams; i++) {
			AVCodecContext *candidate = lavcfile->fctx->streams[i]->codec;
			if (candidate->codec_type == CODEC_TYPE_VIDEO) {
				codecContext = candidate;
				stream = lavcfile->fctx->streams[i];
				vidStream = i;
				break;
			}
		}
		if (vidStream == -1) throw _T("Could not find a video stream");

		// Find codec
		codec = avcodec_find_decoder(codecContext->codec_id);
		if (!codec) throw _T("Could not find suitable video decoder");

		// Enable truncation
		//if (codec->capabilities & CODEC_CAP_TRUNCATED) codecContext->flags |= CODEC_FLAG_TRUNCATED;

		// Open codec
		result = avcodec_open(codecContext,codec);
		if (result < 0) {
			// Close() only calls avcodec_close() when codec is set. Clear it
			// so the handler below does not close a context that was never
			// successfully opened.
			codec = NULL;
			throw _T("Failed to open video decoder");
		}

		// Parse file for keyframes and other useful stuff
		LAVCKeyFrames LAVCFrameData(filename);
		KeyFramesList = LAVCFrameData.GetKeyFrames();
		keyFramesLoaded = true;
		// set length etc.
		length = LAVCFrameData.GetNumFrames();
		framesData = LAVCFrameData.GetFrameData();

#if 0
		isMkv = false;
		length = stream->duration;
		if (length <= 0) {
			if (strcmp(formatContext->iformat->name,"matroska") == 0) {
				//throw _T("FFmpeg fails at seeking Matroska. If you have any idea on how to fix it, Aegisub is open source.");
				mkv.Open(filename);
				length = mkv.GetFrameCount();
				bytePos = mkv.GetBytePositions();
				isMkv = true;
			}
			if (length <= 0) throw _T("Returned invalid stream length");
		}
#endif

		// Allocate frame
		frame = avcodec_alloc_frame();

		// Set frame
		frameNumber = -1;
		lastFrameNumber = -1;
	}

	// Catch errors
	catch (...) {
		Close();
		throw;
	}
}


///////////////
// Close video
// Releases every buffer, frame and context owned by the provider and resets
// the corresponding members, so it is safe to call more than once.
void LAVCVideoProvider::Close() {
	// Close mkv
#if 0
	if (isMkv) mkv.Close();
#endif

	// Clean buffers
	// These are byte arrays (bufferRGB is allocated with new uint8_t[] in
	// GetFrame), so they must be released with delete[]. delete[] on a null
	// pointer is a no-op, hence no null checks.
	delete[] buffer1;
	delete[] buffer2;
	buffer1 = NULL;
	buffer2 = NULL;
	buffer1Size = 0;
	buffer2Size = 0;

	// Clean frame
	if (frame) av_free((void*)frame);
	frame = NULL;

	// Free SWS context and other stuff from RGB conversion
	if (sws_context)
		sws_freeContext(sws_context);
	sws_context = NULL;

	if (frameRGB)
		av_free(frameRGB);
	frameRGB = NULL;

	delete[] bufferRGB;
	bufferRGB = NULL;

	// Close codec context
	if (codec && codecContext) avcodec_close(codecContext);
	codecContext = NULL;
	codec = NULL;

	// Close format context
	if (lavcfile)
		lavcfile->Release();
	lavcfile = NULL;
}


//////////////////
// Get next frame
// Reads packets until one complete video frame has been decoded into 'frame'.
// *startDTS receives the DTS of the first video packet read by this call, or
// stays -1 if no video packet was read.
// Returns true when a frame was completed, false when av_read_frame() has no
// more packets to give.
bool LAVCVideoProvider::GetNextFrame(int64_t *startDTS) {
	AVPacket packet;
	*startDTS = -1; // magic

	// Read packet
	while (av_read_frame(lavcfile->fctx, &packet)>=0) {
		// Check if packet is part of video stream
		if (packet.stream_index == vidStream) {
			// Decode frame
			// Start from "not finished": the decoder's return value is not
			// checked here, so this must not be read uninitialised if the
			// call fails before writing it.
			int frameFinished = 0;
			if (*startDTS < 0)
				*startDTS = packet.dts;

			avcodec_decode_video(codecContext, frame, &frameFinished, packet.data, packet.size);

			// Success?
			if (frameFinished) {
				// Set time
				lastDecodeTime = packet.dts;

				// Free packet and return
				av_free_packet(&packet);
				return true;
			}
		}

		// free packet
		av_free_packet(&packet);
	}

	// No more packets
	return false;
}


/////////////////////////////////
//// Convert AVFrame to wxBitmap
/*
wxBitmap LAVCVideoProvider::AVFrameToWX(AVFrame *source, int n) {
	// Get sizes
	int w = codecContext->width;
	int h = codecContext->height;
//#ifdef __WINDOWS__
//	PixelFormat format = PIX_FMT_RGBA32;
//#else
	PixelFormat format = PIX_FMT_RGB24;
//#endif
	unsigned int size1 = avpicture_get_size(codecContext->pix_fmt,display_w,display_h);
	unsigned int size2 = avpicture_get_size(format,display_w,display_h);

	// Prepare buffers
	if (!buffer1 || buffer1Size != size1) {
		if (buffer1) delete buffer1;
		buffer1 = new uint8_t[size1];
		buffer1Size = size1;
	}
	if (!buffer2 || buffer2Size != size2) {
		if (buffer2) delete buffer2;
		buffer2 = new uint8_t[size2];
		buffer2Size = size2;
	}

	// Resize
	AVFrame *resized;
	bool resize = w != display_w || h != display_h;
	if (resize) {
		// Allocate
		unsigned int resSize = avpicture_get_size(codecContext->pix_fmt,display_w,display_h);
		resized = avcodec_alloc_frame();
		avpicture_fill((AVPicture*) resized, buffer1, codecContext->pix_fmt, display_w, display_h);

		// Resize
		ImgReSampleContext *resampleContext = img_resample_init(display_w,display_h,w,h);
		img_resample(resampleContext,(AVPicture*) resized,(AVPicture*) source);
		img_resample_close(resampleContext);

		// Set new w/h
		w = display_w;
		h = display_h;
	}
	else resized = source;

	// Allocate RGB32 buffer
	AVFrame *frameRGB = avcodec_alloc_frame();
	avpicture_fill((AVPicture*) frameRGB, buffer2, format, w, h);

	// Convert to RGB32
	img_convert((AVPicture*) frameRGB, format, (AVPicture*) resized, codecContext->pix_fmt, w, h);

	// Convert to wxBitmap
	wxImage img(w, h, false);
	unsigned char *data = (unsigned char *)malloc(w * h * 3);
	memcpy(data, frameRGB->data[0], w * h * 3);
	img.SetData(data);
	if (overlay)
		overlay->Render(img, VFR_Input.GetTimeAtFrame(n));

	wxBitmap bmp(img);

	av_free(frameRGB);
	if (resized != source)
		av_free(resized);
	return bmp;
}
*/


/////////////
// Get frame
// Returns frame n converted to RGB32.
// A repeated request for the last returned frame is served from curFrame.
// Otherwise the decoder seeks to the keyframe found by FindClosestKeyframe()
// when needed, and decodes forward until frame n has been produced.
// The formatType argument is not used by this function.
// Throws a _T() string if the position reached by a seek cannot be mapped
// back to a frame number.
const AegiVideoFrame LAVCVideoProvider::GetFrame(int n,int formatType) {
	// Return stored frame
	// n = MID(0,n,GetFrameCount()-1);
	if (n == lastFrameNumber) {
		validFrame = true;
		return curFrame;
	}

	if (frameNumber < 0)
		frameNumber = 0;

	// Following frame, just get it
	/* if (n == frameNumber+1) {
		int64_t temp = -1;
		GetNextFrame(&temp);
	} */

	// Needs to seek
	// else {
		// Prepare seek
		// int64_t seekTo;
		// int result = 0;
		int closestKeyFrame = FindClosestKeyframe(n);

#if 0
		// Get time to seek to
		if (isMkv) {
			//int64_t base = AV_TIME_BASE;
			//int64_t time = VFR_Output.GetTimeAtFrame(n,true) * base / 1000000;
			//seekTo = av_rescale(time,stream->time_base.den,AV_TIME_BASE * int64_t(stream->time_base.num));
			//seekTo = int64_t(n) * 1000 * stream->r_frame_rate.den / stream->r_frame_rate.num;
			//seekTo = bytePos[n];
			//result = av_seek_frame(formatContext,vidStream,seekTo,AVSEEK_FLAG_BACKWARD | AVSEEK_FLAG_BYTE);

			// Prepare mkv seek
			ulonglong startTime, endTime, filePos;
			unsigned int rt, frameSize, frameFlags;
			ulonglong targetTime = (int64_t)(VFR_Output.GetTimeAtFrame(n,true,true))*1000000;
			//ulonglong targetTime = (int64_t)(n) * 1000 * stream->r_frame_rate.den / stream->r_frame_rate.num;
			//ulonglong targetTime = mkv.rawFrames[n].time * 1000000;
			mkv_Seek(mkv.file,targetTime,MKVF_SEEK_TO_PREV_KEYFRAME);

			// Seek
			if (mkv_ReadFrame(mkv.file,0,&rt,&startTime,&endTime,&filePos,&frameSize,&frameFlags) == 0) {
				result = av_seek_frame(formatContext,vidStream,filePos,AVSEEK_FLAG_BYTE | AVSEEK_FLAG_BACKWARD);
				int curpos = 0;
				// NOTE(review): the rest of this disabled Matroska seek path
				// (a loop over i, the closing braces and the matching else)
				// was truncated in the file as received. It is dead code;
				// restore it from version control if it is still wanted.
#endif

		// NOTE(review): the declaration of hasSeeked and the left-hand side
		// of the condition below were truncated in the file as received;
		// only the "> frameNumber+10" tail survived. The reconstruction seeks
		// when the target lies behind the decoder position, or when its
		// keyframe is more than 10 frames ahead of it - confirm.
		bool hasSeeked = false;

		if (n < frameNumber || closestKeyFrame > frameNumber+10) {
			// do it
			av_seek_frame(lavcfile->fctx, vidStream, framesData[closestKeyFrame].DTS, AVSEEK_FLAG_BACKWARD);
			avcodec_flush_buffers(codecContext);
			hasSeeked = true;
		}

		// decode frames until we have the one we want
		do {
			int64_t startTime;
			GetNextFrame(&startTime);

			if (hasSeeked) {
				hasSeeked = false;

				// is the seek destination known? does it belong to a frame?
				if (startTime < 0 || (frameNumber = FrameFromDTS(startTime)) < 0)
					throw _T("ffmpeg video provider: frame accurate seeking failed");
				//frameNumber = ClosestFrameFromDTS(startTime);
			}

			frameNumber++;
		} while (frameNumber <= n);

		// Seek to keyframe
		/* if (result == 0) {
			avcodec_flush_buffers(codecContext);

			// Seek until final frame
			bool ok = true;
			do {
				ok = GetNextFrame();
			} while (lastDecodeTime <= n && ok);
		}

		// Failed seeking
		else {
			GetNextFrame();
		}*/
#if 0
		}
#endif
	//}

	// Get aegisub frame
	AegiVideoFrame &output = curFrame;

	if (frame) {
		int w = codecContext->width;
		int h = codecContext->height;
		PixelFormat srcFormat = codecContext->pix_fmt;
		PixelFormat dstFormat = PIX_FMT_RGB32;

		// Allocate RGB32 buffer
		// The conversion state is created on the first converted frame and
		// reused afterwards; Close() releases it.
		if (!sws_context) //first frame
		{
			frameRGB = avcodec_alloc_frame();
			unsigned int dstSize = avpicture_get_size(dstFormat,w,h);
			bufferRGB = new uint8_t[dstSize];

			sws_context = sws_getContext(w, h, srcFormat, w, h, dstFormat, SWS_PRINT_INFO, NULL, NULL, NULL);
		}
		avpicture_fill((AVPicture*) frameRGB, bufferRGB, dstFormat, w, h);

		// Set AegiVideoFrame
		output.w = w;
		output.h = h;
		output.flipped = false;
		output.invertChannels = true;
		output.format = FORMAT_RGB32;

		// Allocate
		for (int i=0;i<4;i++) output.pitch[i] = frameRGB->linesize[i];
		output.Allocate();

		// Convert to RGB32, and write directly to the output frame
		sws_scale(sws_context, frame->data, frame->linesize, 0, h, output.data, frameRGB->linesize);
	}
	else // No frame available
	{
		output = AegiVideoFrame(GetWidth(),GetHeight());
	}

	// Set current frame
	validFrame = true;
	lastFrameNumber = n;

	// Return
	return output;
}


////////////////
// Get position
// Returns the decoder's frame counter as maintained by GetFrame().
int LAVCVideoProvider::GetPosition() {
	return frameNumber;
}


////////////////////////
// Get number of frames
// Returns the frame count obtained from the keyframe index in LoadVideo().
int LAVCVideoProvider::GetFrameCount() {
	return length;
}


//////////////////
// Get frame rate
// Returns the stream's r_frame_rate as a floating point value.
double LAVCVideoProvider::GetFPS() {
	return double(stream->r_frame_rate.num) / double(stream->r_frame_rate.den);
}


//////////////////////
// Get original width
int LAVCVideoProvider::GetWidth() {
	return codecContext->width;
}


///////////////////////
// Get original height
int LAVCVideoProvider::GetHeight() {
	return codecContext->height;
}


//////////////////////
// Find the keyframe we should seek to if we want to seek to a given frame N
// Walks backwards from frameN and returns the index of the first frame that
// is flagged as a keyframe, or 0 if none is found above index 0.
int LAVCVideoProvider::FindClosestKeyframe(int frameN) {
	// Clamp the starting point so a request past the last indexed frame
	// cannot read beyond the end of framesData.
	const int lastIndex = (int)framesData.size() - 1;
	if (frameN > lastIndex)
		frameN = lastIndex;

	for (int i = frameN; i > 0; i--)
		if (framesData[i].isKeyFrame)
			return i;
	return 0;
}


//////////////////////
// Convert a DTS into a frame number
// Returns the index of the first frame whose DTS equals ADTS, or -1 if there
// is no exact match.
int LAVCVideoProvider::FrameFromDTS(int64_t ADTS) {
	for (int i = 0; i < (int)framesData.size(); i++)
		if (framesData[i].DTS == ADTS)
			return i;
	return -1;
}


//////////////////////
// Find closest frame to the given DTS
// Returns the index of the frame whose DTS has the smallest absolute
// difference from ADTS; the earliest such frame wins ties. Returns 0 when
// framesData is empty.
int LAVCVideoProvider::ClosestFrameFromDTS(int64_t ADTS) {
	int n = 0;
	int64_t bestDiff = 0xFFFFFFFFFFFFFFLL; // big number
	for (int i = 0; i < (int)framesData.size(); i++) {
		int64_t currentDiff = FFABS(framesData[i].DTS - ADTS);
		if (currentDiff < bestDiff) {
			bestDiff = currentDiff;
			n = i;
		}
	}
	return n;
}

#endif // WITH_FFMPEG