SmartAudio/package/allwinner/tina_multimedia/libcedarx/xmetadataretriever/xmetadataretriever.c

1896 lines
63 KiB
C
Raw Permalink Normal View History

2018-07-13 01:31:50 +00:00
/*
* Copyright (c) 2008-2016 Allwinner Technology Co. Ltd.
* All rights reserved.
*
* File : xmetadataretriever.c
* Description : xmetadataretriever for Linux,
* get mediainfo and thumbnail picture
* History :
*
*/
#define LOG_TAG "xmetadataretriever"
#include "cdx_log.h"
#include "xmetadataretriever.h"
#include "memoryAdapter.h"
#include "iniparserapi.h"
#include <stdio.h>
#include <stdlib.h>
#include <sys/time.h>
#include <inttypes.h>
#define SAVE_BITSTREAM 0
#define SAVE_RGB 0
#if SAVE_BITSTREAM
const char* bitstreamPath = "/data/camera/out.h264";
static FILE* fph264 = NULL;
#endif
/* process 1024 packets to get a frame at maximum. */
#define MAX_PACKET_COUNT_TO_GET_A_FRAME 4096
#define MAX_TIME_TO_GET_A_FRAME 5000000 /* use 5 seconds to get a frame at maximum. */
#define MAX_TIME_TO_GET_A_STREAM 10000000 /* use 10 seconds to get a stream at maximum. */
#define MAX_OUTPUT_STREAM_SIZE (1024*1024)
typedef struct XRetrieverContext
{
CdxDataSourceT mSource;
CdxMediaInfoT mMediaInfo;
CdxParserT* mParser;
CdxStreamT* mStream;
VideoDecoder* mVideoDecoder;
XVideoFrame mVideoFrame;
XVideoStream mVideoStream;
int mCancelPrepareFlag;
struct ScMemOpsS *memops;
}XRetrieverContext;
static int64_t GetSysTime();
#if SAVE_RGB
//-------------------------------------------------------------------
/*
<EFBFBD><EFBFBD><EFBFBD><EFBFBD>λͼ<EFBFBD>ļ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <EFBFBD><EFBFBD> <EFBFBD><EFBFBD>
λͼ<EFBFBD>ļ<EFBFBD>ͷ (bitmap-file header) BITMAPFILEHEADER bmfh
λͼ<EFBFBD><EFBFBD>Ϣͷ (bitmap-information header) BITMAPINFOHEADER bmih
<EFBFBD><EFBFBD>ɫ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>(color table) RGBQUAD aColors[]
ͼ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ֽ<EFBFBD> BYTE aBitmapBits[]
*/
typedef struct bmp_header
{
short twobyte ;//<2F><><EFBFBD><EFBFBD><EFBFBD>ֽڣ<D6BD><DAA3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>֤<EFBFBD><D6A4><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ա<EFBFBD><D4B1><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>У<EFBFBD><D0A3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ַ<EFBFBD><D6B7><EFBFBD><EFBFBD><EFBFBD>д<EFBFBD><D0B4><EFBFBD>ļ<EFBFBD><C4BC><EFBFBD>
//14B
char bfType[2] ;//!<21>ļ<EFBFBD><C4BC><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>,<2C><>ֵ<EFBFBD><D6B5><EFBFBD><EFBFBD><EFBFBD><EFBFBD>0x4D42<34><32>Ҳ<EFBFBD><D2B2><EFBFBD><EFBFBD><EFBFBD>ַ<EFBFBD>'BM'
unsigned int bfSize ;//!˵<><CBB5><EFBFBD>ļ<EFBFBD><C4BC>Ĵ<EFBFBD>С<EFBFBD><D0A1><EFBFBD><EFBFBD><EFBFBD>ֽ<EFBFBD>Ϊ<EFBFBD><CEAA>λ
unsigned int bfReserved1;//<2F><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ0
unsigned int bfOffBits ;//!˵<><CBB5><EFBFBD><EFBFBD><EFBFBD>ļ<EFBFBD>ͷ<EFBFBD><CDB7>ʼ<EFBFBD><CABC>ʵ<EFBFBD>ʵ<EFBFBD>ͼ<EFBFBD><CDBC><EFBFBD><EFBFBD><EFBFBD><EFBFBD>֮<EFBFBD><D6AE><EFBFBD><EFBFBD><EFBFBD>ֽڵ<D6BD>ƫ<EFBFBD><C6AB><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ14B+sizeof(BMPINFO)
}BMPHEADER;
typedef struct bmp_info
{
//40B
unsigned int biSize ;//!BMPINFO<46><EFBFBD><E1B9B9><EFBFBD><EFBFBD>Ҫ<EFBFBD><D2AA><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
int biWidth ;//!ͼ<><CDBC><EFBFBD>Ŀ<EFBFBD><C4BF>ȣ<EFBFBD><C8A3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ<EFBFBD><CEAA>λ
int biHeight ;//!ͼ<><CDBC><EFBFBD>Ŀ<EFBFBD><C4BF>ȣ<EFBFBD><C8A3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ<EFBFBD><CEAA>λ,<2C><><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ֵ<EFBFBD><D6B5><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
//˵<><CBB5>ͼ<EFBFBD><CDBC><EFBFBD>ǵ<EFBFBD><C7B5><EFBFBD><EFBFBD>ģ<EFBFBD><C4A3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ֵ<EFBFBD>Ǹ<EFBFBD><C7B8><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
unsigned short biPlanes ;//!Ŀ<><C4BF><EFBFBD>豸˵<E8B1B8><CBB5>λ<EFBFBD><CEBB><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ֵ<EFBFBD><D6B5><EFBFBD><EFBFBD><EFBFBD>DZ<EFBFBD><C7B1><EFBFBD>Ϊ1
unsigned short biBitCount ;//!<21><><EFBFBD><EFBFBD><EFBFBD><EFBFBD>/<2F><><EFBFBD>أ<EFBFBD><D8A3><EFBFBD>ֵΪ1<CEAA><31>4<EFBFBD><34>8<EFBFBD><38>16<31><36>24<32><34><EFBFBD><EFBFBD>32
unsigned int biCompression ;//˵<><CBB5>ͼ<EFBFBD><CDBC><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ѹ<EFBFBD><D1B9><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
#define BI_RGB 0L //û<><C3BB>ѹ<EFBFBD><D1B9>
#define BI_RLE8 1L //ÿ<><C3BF><EFBFBD><EFBFBD><EFBFBD><EFBFBD>8<EFBFBD><38><EFBFBD>ص<EFBFBD>RLEѹ<45><D1B9><EFBFBD><EFBFBD><EFBFBD>룬ѹ<EBA3AC><D1B9><EFBFBD><EFBFBD>ʽ<EFBFBD><CABD>2<EFBFBD>ֽ<EFBFBD><D6BD><EFBFBD><EFBFBD>ɣ<EFBFBD><C9A3>ظ<EFBFBD><D8B8><EFBFBD><EFBFBD>ؼ<EFBFBD><D8BC><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɫ<EFBFBD><C9AB><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
#define BI_RLE4 2L //ÿ<><C3BF><EFBFBD><EFBFBD><EFBFBD><EFBFBD>4<EFBFBD><34><EFBFBD>ص<EFBFBD>RLEѹ<45><D1B9><EFBFBD><EFBFBD><EFBFBD>룬ѹ<EBA3AC><D1B9><EFBFBD><EFBFBD>ʽ<EFBFBD><CABD>2<EFBFBD>ֽ<EFBFBD><D6BD><EFBFBD><EFBFBD><EFBFBD>
#define BI_BITFIELDS 3L //ÿ<><C3BF><EFBFBD><EFBFBD><EFBFBD>صı<D8B5><C4B1><EFBFBD><EFBFBD><EFBFBD>ָ<EFBFBD><D6B8><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
unsigned int biSizeImage ;//ͼ<><CDBC><EFBFBD>Ĵ<EFBFBD>С<EFBFBD><D0A1><EFBFBD><EFBFBD><EFBFBD>ֽ<EFBFBD>Ϊ<EFBFBD><CEAA>λ<EFBFBD><CEBB><EFBFBD><EFBFBD><EFBFBD><EFBFBD>BI_RGB<47><42>ʽʱ<CABD><CAB1><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ0
int biXPelsPerMeter ;//ˮƽ<CBAE>ֱ<EFBFBD><D6B1>ʣ<EFBFBD><CAA3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>/<2F>ױ<EFBFBD>ʾ
int biYPelsPerMeter ;//<2F><>ֱ<EFBFBD>ֱ<EFBFBD><D6B1>ʣ<EFBFBD><CAA3><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>/<2F>ױ<EFBFBD>ʾ
unsigned int biClrUsed ;//λͼʵ<CDBC><CAB5>ʹ<EFBFBD>õIJ<C3B5>ɫ<EFBFBD><C9AB><EFBFBD>е<EFBFBD><D0B5><EFBFBD>ɫ<EFBFBD><C9AB><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ϊ0<CEAA>Ļ<EFBFBD><C4BB><EFBFBD><EFBFBD><EFBFBD>˵<EFBFBD><CBB5>ʹ<EFBFBD><CAB9><EFBFBD><EFBFBD><EFBFBD>е<EFBFBD>ɫ<EFBFBD><C9AB><EFBFBD>
unsigned int biClrImportant ;//<2F><>ͼ<EFBFBD><CDBC><EFBFBD><EFBFBD>ʾ<EFBFBD><CABE><EFBFBD><EFBFBD>ҪӰ<D2AA><D3B0><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɫ<EFBFBD><C9AB><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ŀ<EFBFBD><C4BF><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>0<EFBFBD><30><EFBFBD><EFBFBD>ʾ<EFBFBD><CABE><EFBFBD><EFBFBD>Ҫ<EFBFBD><D2AA>
}BMPINFO;
typedef struct tagRGBQUAD
{
unsigned char rgbBlue;
unsigned char rgbGreen;
unsigned char rgbRed;
unsigned char rgbReserved;
} RGBQUAD;
typedef struct tagBITMAPINFO
{
BMPINFO bmiHeader;
//RGBQUAD bmiColors[1];
unsigned int rgb[3];
} BITMAPINFO;
static int get_rgb565_header(int w, int h, BMPHEADER * head, BITMAPINFO * info)
{
int size = 0;
if (head && info)
{
size = w * h * 2;
memset(head, 0, sizeof(* head));
memset(info, 0, sizeof(* info));
head->bfType[0] = 'B';
head->bfType[1] = 'M';
head->bfOffBits = 14 + sizeof(* info);
head->bfSize = head->bfOffBits + size;
head->bfSize = (head->bfSize + 3) & ~3;
size = head->bfSize - head->bfOffBits;
info->bmiHeader.biSize = sizeof(info->bmiHeader);
info->bmiHeader.biWidth = w;
info->bmiHeader.biHeight = -h;
info->bmiHeader.biPlanes = 1;
info->bmiHeader.biBitCount = 16;
info->bmiHeader.biCompression = BI_BITFIELDS;
info->bmiHeader.biSizeImage = size;
info->rgb[0] = 0xF800;
info->rgb[1] = 0x07E0;
info->rgb[2] = 0x001F;
logd("rgb565:%dbit,%d*%d,%d\n", info->bmiHeader.biBitCount, w, h, head->bfSize);
}
return size;
}
static int save_bmp_rgb565(FILE* fp, int width, int height, unsigned char* pData)
{
int success = 0;
int size = 0;
BMPHEADER head;
BITMAPINFO info;
size = get_rgb565_header(width, height, &head, &info);
if(size > 0)
{
fwrite(head.bfType,1,2,fp);
fwrite(&head.bfSize,1,4,fp);
fwrite(&head.bfReserved1,1,4,fp);
fwrite(&head.bfOffBits,1,4,fp);
fwrite(&info,1,sizeof(info), fp);
fwrite(pData,1,size, fp);
success = 1;
}
logd("*****success=%d\n", success);
return success;
}
#endif
// B = 1.164 * (Y - 16) + 2.018 * (U - 128)
// G = 1.164 * (Y - 16) - 0.813 * (V - 128) - 0.391 * (U - 128)
// R = 1.164 * (Y - 16) + 1.596 * (V - 128)
// B = 298/256 * (Y - 16) + 517/256 * (U - 128)
// G = .................. - 208/256 * (V - 128) - 100/256 * (U - 128)
// R = .................. + 409/256 * (V - 128)
// min_B = (298 * (- 16) + 517 * (- 128)) / 256 = -277
// min_G = (298 * (- 16) - 208 * (255 - 128) - 100 * (255 - 128)) / 256 = -172
// min_R = (298 * (- 16) + 409 * (- 128)) / 256 = -223
// max_B = (298 * (255 - 16) + 517 * (255 - 128)) / 256 = 534
// max_G = (298 * (255 - 16) - 208 * (- 128) - 100 * (- 128)) / 256 = 432
// max_R = (298 * (255 - 16) + 409 * (255 - 128)) / 256 = 481
// clip range -278 .. 535
typedef struct {
int nPicWidth;
int nPicHeight;
unsigned char* pData;
unsigned int nDataSize;
}RgbVideoFrame;
2018-12-13 10:48:25 +00:00
static int transformPictureNV21ToRGB565(struct ScMemOpsS *memOps,
VideoPicture * pPicture,
XVideoFrame* pVideoFrame)
{
unsigned short* pDst;
unsigned char* pSrcY;
unsigned char* pSrcU;
int y;
int x;
unsigned char* pClipTable;
unsigned char* pClip;
static const int nClipMin = -278;
static const int nClipMax = 535;
if((pPicture->ePixelFormat!= PIXEL_FORMAT_NV12) &&
(pPicture->ePixelFormat!= PIXEL_FORMAT_NV21))
{
loge("source pixel format is not NV12, quit.");
return -1;
}
//* initialize the clip table.
pClipTable = (unsigned char*)malloc(nClipMax - nClipMin + 1);
if(pClipTable == NULL)
{
loge("can not allocate memory for the clip table, quit.");
return -1;
}
for(x=nClipMin; x<=nClipMax; x++)
{
pClipTable[x-nClipMin] = (x<0) ? 0 : (x>255) ? 255 : x;
}
pClip = &pClipTable[-nClipMin];
//* flush cache.
CdcMemFlushCache(memOps, pPicture->pData0, pPicture->nLineStride*pPicture->nHeight);
CdcMemFlushCache(memOps, pPicture->pData1, pPicture->nLineStride*pPicture->nHeight/2);
//* set pointers.
pDst = (unsigned short*)pVideoFrame->mData;
pSrcY = (unsigned char*)pPicture->pData0 + pPicture->nTopOffset * \
pPicture->nLineStride + pPicture->nLeftOffset;
pSrcU = (unsigned char*)pPicture->pData1 + (pPicture->nTopOffset/2) * \
(pPicture->nLineStride/2) + pPicture->nLeftOffset/2;
signed y1, y2;
signed u, v;
for(y = 0; y < (int)pVideoFrame->mHeight; ++y)
{
for(x = 0; x < (int)pVideoFrame->mWidth; x += 2)
{
y1 = (signed)pSrcY[x] - 16;
y2 = (signed)pSrcY[x + 1] - 16;
if(pPicture->ePixelFormat == PIXEL_FORMAT_NV12)
{
u = (signed)pSrcU[x] - 128;
v = (signed)pSrcU[x + 1] - 128;
}
else
{
v = (signed)pSrcU[x] - 128;
u = (signed)pSrcU[x + 1] - 128;
}
signed u_b = u * 517;
signed u_g = -u * 100;
signed v_g = -v * 208;
signed v_r = v * 409;
signed tmp1 = y1 * 298;
signed b1 = (tmp1 + u_b) / 256;
signed g1 = (tmp1 + v_g + u_g) / 256;
signed r1 = (tmp1 + v_r) / 256;
signed tmp2 = y2 * 298;
signed b2 = (tmp2 + u_b) / 256;
signed g2 = (tmp2 + v_g + u_g) / 256;
signed r2 = (tmp2 + v_r) / 256;
unsigned int rgb1 = ((pClip[r1] >> 3) << 11) |
((pClip[g1] >> 2) << 5) |
(pClip[b1] >> 3);
unsigned int rgb2 = ((pClip[r2] >> 3) << 11) |
((pClip[g2] >> 2) << 5) |
(pClip[b2] >> 3);
*(unsigned int *)(&pDst[x]) = (rgb2 << 16) | rgb1;
}
pSrcY += pPicture->nLineStride;
if(y & 1)
{
pSrcU += pPicture->nLineStride;
}
pDst += pVideoFrame->mWidth;
}
free(pClipTable);
return 0;
}
2018-07-13 01:31:50 +00:00
static int transformPictureMb32ToRGB(struct ScMemOpsS *memOps,
VideoPicture * pPicture,
XVideoFrame* pVideoFrame)
{
unsigned char* pClipTable;
unsigned char* pClip;
static const int nClipMin = -278;
static const int nClipMax = 535;
unsigned short* pDst = NULL;
unsigned char* pSrcY = NULL;
unsigned char* pSrcVU = NULL;
int x = 0;
int y = 0;
int nMbWidth = 0;
int nMbHeight = 0;
int nVMb = 0;
int nHMb = 0;
int yPos = 0;
int pos = 0;
int uvPos = 0;
// <20><><EFBFBD>Խ<EFBFBD>pClipTable <20>Բ<EFBFBD><D4B2><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ʽ<EFBFBD><CABD><EFBFBD><EFBFBD>transformPictureMb32ToRGB
//* initialize the clip table.
pClipTable = (unsigned char*)malloc(nClipMax - nClipMin + 1);
if(pClipTable == NULL)
{
loge("can not allocate memory for the clip table, quit.");
return -1;
}
for(x=nClipMin; x<=nClipMax; x++)
{
pClipTable[x-nClipMin] = (x<0) ? 0 : (x>255) ? 255 : x;
}
pClip = &pClipTable[-nClipMin];
//* flush cache.
CdcMemFlushCache(memOps, pPicture->pData0, pPicture->nWidth*pPicture->nHeight);
CdcMemFlushCache(memOps, pPicture->pData1, pPicture->nHeight*pPicture->nHeight/2);
pDst = (unsigned short*)pVideoFrame->mData;
pSrcY = (unsigned char*)pPicture->pData0;
pSrcVU = (unsigned char*)pPicture->pData1;
nMbWidth = pPicture->nWidth/32;
nMbHeight = pPicture->nHeight/32;
for(nVMb=0; nVMb<nMbHeight;nVMb++)
{
for(nHMb=0; nHMb<nMbWidth; nHMb++)
{
pos = nVMb*pPicture->nWidth*32+nHMb*32;
for(y=0; y<32; y++)
{
yPos = (nVMb*nMbWidth+nHMb)*1024+y*32;
uvPos = ((nVMb/2)*nMbWidth*1024)+nHMb*1024+(y/2)*32+ (((nVMb%2)==1) ? 512 : 0);
for(x=0; x<32; x+=2)
{
signed y1 = (signed)pSrcY[yPos+x+0] - 16;
signed y2 = (signed)pSrcY[yPos+x+1] - 16;
signed u = (signed)pSrcVU[uvPos+x+0] - 128;
signed v = (signed)pSrcVU[uvPos+x+1] - 128;
signed u_b = u * 517;
signed u_g = -u * 100;
signed v_g = -v * 208;
signed v_r = v * 409;
signed tmp1 = y1 * 298;
signed b1 = (tmp1 + u_b) / 256;
signed g1 = (tmp1 + v_g + u_g) / 256;
signed r1 = (tmp1 + v_r) / 256;
signed tmp2 = y2 * 298;
signed b2 = (tmp2 + u_b) / 256;
signed g2 = (tmp2 + v_g + u_g) / 256;
signed r2 = (tmp2 + v_r) / 256;
unsigned int rgb1 = ((pClip[r1] >> 3) << 11) |
((pClip[g1] >> 2) << 5) |
(pClip[b1] >> 3);
unsigned int rgb2 = ((pClip[r2] >> 3) << 11) |
((pClip[g2] >> 2) << 5) |
(pClip[b2] >> 3);
*(unsigned int *)(&pDst[pos]) = (rgb2 << 16) | rgb1;
pos += 2;
}
pos += (nMbWidth-1)*32;
}
}
}
pDst = (unsigned short*)pVideoFrame->mData;
for(y=0; y<pPicture->nTopOffset; y++)
{
memset(pDst+y*pVideoFrame->mWidth, 0, 2*pVideoFrame->mWidth);
}
for(y=pPicture->nBottomOffset; y<(int)pVideoFrame->mHeight; y++)
{
memset(pDst+y*pVideoFrame->mWidth, 0, 2*pVideoFrame->mWidth);
}
for(y=pPicture->nTopOffset; y<pPicture->nBottomOffset; y++)
{
memset(pDst+y*pVideoFrame->mWidth, 0, 2*pPicture->nLeftOffset);
memset(pDst+y*pVideoFrame->mWidth+pPicture->nRightOffset, 0,
2*(pVideoFrame->mWidth-pPicture->nRightOffset));
}
free(pClipTable);
#if SAVE_RGB
FILE* outFp = fopen("/data/UDISK/rgb.bmp", "wb");
if(outFp != NULL)
{
logd("************save_bmp_rgb565\n");
save_bmp_rgb565(outFp, pVideoFrame->mWidth, pVideoFrame->mHeight, pVideoFrame->mData);
fclose(outFp);
}
#endif
return 0;
}
static int transformPicture(struct ScMemOpsS *memOps,
VideoPicture * pPicture,
XVideoFrame* pVideoFrame);
static void clear(XRetriever* v)
{
XRetrieverContext* p;
p = (XRetrieverContext*)v;
if(p->mParser)
{
CdxParserForceStop(p->mParser); //* to prevend parser from blocking at a network io.
CdxParserClose(p->mParser);
p->mParser = NULL;
p->mStream = NULL;
}
else if(p->mStream)
{
CdxStreamForceStop(p->mStream);
CdxStreamClose(p->mStream);
p->mStream = NULL;
}
if(p->mVideoDecoder != NULL)
{
DestroyVideoDecoder(p->mVideoDecoder);
p->mVideoDecoder = NULL;
}
if(p->mSource.uri)
{
free(p->mSource.uri);
}
memset(&p->mMediaInfo, 0, sizeof(CdxMediaInfoT));
if(p->mVideoFrame.mData)
{
free(p->mVideoFrame.mData);
p->mVideoFrame.mData = NULL;
}
memset(&p->mVideoFrame, 0x00, sizeof(XVideoFrame));
if(p->mVideoStream.mBuf)
{
free(p->mVideoStream.mBuf);
p->mVideoStream.mBuf = NULL;
}
memset(&p->mVideoStream, 0x00, sizeof(XVideoStream));
return;
}
XRetriever* XRetrieverCreate()
{
XRetrieverContext* p;
p = (XRetrieverContext*)malloc(sizeof(XRetrieverContext));
if(!p)
{
return NULL;
}
memset(p, 0x00, sizeof(XRetrieverContext));
memset(&p->mSource, 0, sizeof(CdxDataSourceT));
p->memops = MemAdapterGetOpsS();
if(p->memops == NULL)
{
free(p);
return NULL;
}
CdcMemOpen(p->memops);
return (XRetriever*)p;
}
int XRetrieverDestory(XRetriever* v)
{
XRetrieverContext* p;
p = (XRetrieverContext*)v;
clear(v);
CdcMemClose(p->memops);
free(p);
return 0;
}
static int retrieverSetDataSource(XRetrieverContext* p, const char* pUrl,
const CdxKeyedVectorT* pHeaders)
{
if(strstr(pUrl, "://") != NULL)
{
p->mSource.uri = strdup(pUrl);
if(p->mSource.uri == NULL)
{
loge("can not dump string of uri.");
return -1;
}
}
else
{
p->mSource.uri = (char*)malloc(strlen(pUrl)+8);
if(p->mSource.uri == NULL)
{
loge("can not dump string of uri.");
return -1;
}
sprintf(p->mSource.uri, "file://%s", pUrl);
}
if(pHeaders != NULL &&
(!strncasecmp("http://", pUrl, 7) || !strncasecmp("https://", pUrl, 8)))
{
//todo: set headers
int nHeaderSize = CdxKeyedVectorGetSize((CdxKeyedVectorT*)pHeaders);
if(nHeaderSize > 0)
{
p->mSource.extraDataType = EXTRA_DATA_HTTP_HEADER;
}
}
return 0;
}
int XRetrieverSetDataSource(XRetriever* v, const char* pUrl, const CdxKeyedVectorT* pHeaders)
{
int ret;
XRetrieverContext* p;
p = (XRetrieverContext*)v;
clear(v);
//* 1. set the datasource object.
ret = retrieverSetDataSource(p, pUrl, pHeaders);
if(ret < 0)
{
loge("set datasource fail.");
return -1;
}
logd("uri: %s", p->mSource.uri);
//* 2. create a parser.
p->mStream = CdxStreamCreate(&p->mSource);
if(!p->mStream)
{
loge("stream creat fail.");
return -1;
}
ret = CdxStreamConnect(p->mStream);
if(ret < 0)
{
return -1;
}
p->mParser = CdxParserCreate(p->mStream, MUTIL_AUDIO);
if(!p->mParser)
{
loge("parser creat fail.");
return -1;
}
ret = CdxParserInit(p->mParser);
if(ret < 0)
{
return -1;
}
//* 3. get media info.
memset(&p->mMediaInfo, 0, sizeof(CdxMediaInfoT));
if(CdxParserGetMediaInfo(p->mParser, &p->mMediaInfo) == 0)
{
if (p->mParser->type == CDX_PARSER_TS ||
p->mParser->type == CDX_PARSER_BD ||
p->mParser->type == CDX_PARSER_HLS)
{
p->mMediaInfo.program[0].video[0].bIsFramePackage = 0; /* stream package */
}
else
{
p->mMediaInfo.program[0].video[0].bIsFramePackage = 1; /* frame package */
}
}
return 0;
}
static void setScaleRatio(VConfig *vconfig, VideoStreamInfo *videoInfo,
int *hScaleRatio, int *vScaleRatio)
{
int wider = 640, widest = 1280;
int higher = 480, highest = 960;
if (vconfig->nRotateDegree == 1 || vconfig->nRotateDegree == 3)
{
wider = 480;
widest = 960;
higher = 640;
highest = 1280;
}
if(videoInfo->nWidth > widest || videoInfo->nWidth == 0)
*hScaleRatio = 2; //* scale down to 1/4 the original width;
else if(videoInfo->nWidth > wider)
*hScaleRatio = 1; //* scale down to 1/2 the original width;
if(videoInfo->nHeight > highest || videoInfo->nHeight == 0)
*vScaleRatio = 2; //* scale down to 1/4 the original height;
else if(videoInfo->nHeight > higher)
*vScaleRatio = 1; //* scale down to 1/2 the original height;
}
2018-12-13 10:48:25 +00:00
//* option = 0 means seek to the sync frame privious to the timeUs.
//* option = 1 means seek to the sync frame next to the timeUs.
//* option = 2 means seek to the sync frame closest to the timeUs.
//* option = 3 means seek to the closest frame to the timeUs.
XVideoFrame *XRetrieverGetFrameAtTime(XRetriever* v, int64_t timeUs, int option)
2018-07-13 01:31:50 +00:00
{
VideoPicture* pPicture;
int bDone;
int bSuccess;
int bHasVideo;
int nHorizonScaleRatio;
int nVerticalScaleRatio;
VConfig vconfig;
CdxPacketT packet;
int ret;
int nPacketCount;
int64_t nStartTime;
int64_t nTimePassed;
XRetrieverContext* p;
p = (XRetrieverContext*)v;
//* FIXME:
//* if it is a media file with drm protection, we should not return an album art picture.
bDone = 0;
bSuccess = 0;
bHasVideo = 0;
memset(&vconfig, 0, sizeof(VConfig));
//* 1. check whether there is a video stream.
if(p->mMediaInfo.programIndex >= 0 && p->mMediaInfo.programNum >= p->mMediaInfo.programIndex)
{
if(p->mMediaInfo.program[p->mMediaInfo.programIndex].videoNum > 0)
bHasVideo = 1;
}
if(!bHasVideo)
{
logw("media file do not contain a video stream, getFrameAtTime() return fail.");
return NULL;
}
//* 2. create a video decoder.
if(p->mVideoDecoder == NULL)
{
p->mVideoDecoder = CreateVideoDecoder();
//* use decoder to capture thumbnail, decoder use less memory in this mode.
2018-12-13 10:48:25 +00:00
if(option == 3)
{
vconfig.bThumbnailMode = 0;
}
else
{
vconfig.bThumbnailMode = 1;
}
2018-07-13 01:31:50 +00:00
//* all decoder support YV12 format.
// some chip not support yv12, we should set PIXEL_FORMAT_YUV_MB32_420;
const char *vd_outfmt = GetConfigParamterString("vd_output_fmt", NULL);
CDX_LOG_CHECK(vd_outfmt, "vd_output_fmt NULL, pls check your config.");
if (strcmp(vd_outfmt, "mb32") == 0)
{
vconfig.eOutputPixelFormat = PIXEL_FORMAT_YUV_MB32_420;
}
else
{
logd("set default format: yv12");
vconfig.eOutputPixelFormat = PIXEL_FORMAT_YV12;
}
//* no need to decode two picture when decoding a thumbnail picture.
vconfig.bDisable3D = 1;
vconfig.nAlignStride = 16;//* set align stride to 16 as defualt
#if 1
//* set this flag when the parser can give this info,
//* mov files recorded by iphone or android phone
//* conains this info.
//* set the rotation
int nRotateDegree;
int nRotation = atoi((const char*)p->mMediaInfo.rotate);
if(nRotation == 0)
nRotateDegree = 0;
else if(nRotation == 90)
nRotateDegree = 1;
else if(nRotation == 180)
nRotateDegree = 2;
else if(nRotation == 270)
nRotateDegree = 3;
else
nRotateDegree = 0;
if(nRotateDegree != 0)
{
vconfig.bRotationEn = 1;
vconfig.nRotateDegree = nRotateDegree;
}
else
{
vconfig.bRotationEn = 0;
vconfig.nRotateDegree = 0;
}
#endif
//* set the picture scale down ratio,
//* we generate a picture with pixel size less than 640x480.
nHorizonScaleRatio = 0;
nVerticalScaleRatio = 0;
VideoStreamInfo *videoInfo =
p->mMediaInfo.program[p->mMediaInfo.programIndex].video;
setScaleRatio(&vconfig, videoInfo, &nHorizonScaleRatio, &nVerticalScaleRatio);
#if 0
if(vconfig.nRotateDegree == 1 || vconfig.nRotateDegree == 3)
{
/* nWidth=0 treated as nWidth=1920 */
if(videoInfo.nWidth > 960 ||
videoInfo.nWidth == 0)
nHorizonScaleRatio = 2; //* scale down to 1/4 the original width;
else if(videoInfo.nWidth > 480)
nHorizonScaleRatio = 1; //* scale down to 1/2 the original width;
/* nHeight=0 treated as nHeight=1080 */
if(videoInfo.nHeight > 1280 ||
videoInfo.nHeight == 0)
nVerticalScaleRatio = 2; //* scale down to 1/4 the original height;
else if(videoInfo.nHeight > 640)
nVerticalScaleRatio = 1; //* scale down to 1/2 the original height;
}
else
{
/* nWidth=0 treated as nWidth=1920 */
if(videoInfo.nWidth > 1280 ||
videoInfo.nWidth == 0)
nHorizonScaleRatio = 2; //* scale down to 1/4 the original width;
else if(videoInfo.nWidth > 640)
nHorizonScaleRatio = 1; //* scale down to 1/2 the original width;
/* nHeight=0 treated as nHeight=1080 */
if(videoInfo.nHeight > 960 ||
videoInfo.nHeight == 0)
nVerticalScaleRatio = 2; //* scale down to 1/4 the original height;
else if(videoInfo.nHeight > 480)
nVerticalScaleRatio = 1; //* scale down to 1/2 the original height;
}
#endif
//* set to the same scale ratio.
if(nVerticalScaleRatio > nHorizonScaleRatio)
nHorizonScaleRatio = nVerticalScaleRatio;
else
nVerticalScaleRatio = nHorizonScaleRatio;
//* set scale ratio to vconfig.
if(nHorizonScaleRatio || nVerticalScaleRatio)
{
vconfig.bScaleDownEn = 1;
vconfig.nHorizonScaleDownRatio = nHorizonScaleRatio;
vconfig.nVerticalScaleDownRatio = nVerticalScaleRatio;
}
//* initialize the decoder.
vconfig.nVbvBufferSize = 2*1024*1024;
2018-12-13 10:48:25 +00:00
if(videoInfo->nWidth > 3800)
vconfig.nVbvBufferSize = 4*1024*1024;
2018-07-13 01:31:50 +00:00
//###check
vconfig.nDeInterlaceHoldingFrameBufferNum = 0;//GetConfigParamterInt("pic_4di_num", 2);
vconfig.nDisplayHoldingFrameBufferNum = 0;
vconfig.nRotateHoldingFrameBufferNum = GetConfigParamterInt("pic_4rotate_num", 0);
vconfig.nDecodeSmoothFrameBufferNum = GetConfigParamterInt("pic_4smooth_num", 3);
2018-12-13 10:48:25 +00:00
vconfig.bConvertVp910bitTo8bit = 1;
2018-07-13 01:31:50 +00:00
vconfig.memops = p->memops;
if(InitializeVideoDecoder(p->mVideoDecoder,
videoInfo, &vconfig) != 0)
{
loge("initialize video decoder fail.");
return NULL;
}
}
if(timeUs < 0)
{
//The key frame of MKV always at the end of file, need reset to 0,
//otherwise will return mix thumbnail
if(p->mParser->type == CDX_PARSER_MKV)
{
timeUs = 0;
}
else
{
timeUs = ((int64_t)p->mMediaInfo.program[p->mMediaInfo.programIndex].duration*1000/2);
}
}
2018-12-13 10:48:25 +00:00
if(p->mMediaInfo.program[p->mMediaInfo.programIndex].duration < 20000)
2018-07-13 01:31:50 +00:00
{
timeUs = 0;
}
//* 3. seek parser to the specific position.
if(p->mMediaInfo.bSeekable && timeUs > 0 &&
timeUs < ((int64_t)p->mMediaInfo.program[p->mMediaInfo.programIndex].duration*1000))
{
2018-12-13 10:48:25 +00:00
SeekModeType nSeekModeType;
nSeekModeType = AW_SEEK_THUMBNAIL;
if(option == 2)
2018-07-13 01:31:50 +00:00
{
2018-12-13 10:48:25 +00:00
nSeekModeType = AW_SEEK_CLOSEST_SYNC;
}
if(CdxParserSeekTo(p->mParser, timeUs, nSeekModeType) != 0)
{
logw("seek media file error at the specific time %" PRId64 " us.", timeUs);
if(CdxParserSeekTo(p->mParser, 0, nSeekModeType) != 0)
{
loge("seek media file error at the time 0");
return NULL;
}
2018-07-13 01:31:50 +00:00
}
}
else
{
logw("media file do not support seek operation, get frame from the begin.");
}
//* 4. loop to decode a picture.
nPacketCount = 0;
nStartTime = GetSysTime();
2018-12-13 10:48:25 +00:00
int64_t first_pts;
int first_flag = 0;
2018-07-13 01:31:50 +00:00
do
{
//* 4.1 prefetch packet type and packet data size.
packet.flags = 0;
if(CdxParserPrefetch(p->mParser, &packet) != 0)
{
//* prefetch fail, may be file end reached.
bDone = 1;
bSuccess = 0;
break;
}
//* 4.2 feed data to the video decoder.
if(packet.type == CDX_MEDIA_VIDEO && (packet.flags&MINOR_STREAM)==0)
{
ret = RequestVideoStreamBuffer(p->mVideoDecoder,
packet.length,
(char**)&packet.buf,
&packet.buflen,
(char**)&packet.ringBuf,
&packet.ringBufLen,
0);
if(ret==0 && (packet.buflen+packet.ringBufLen)>=packet.length)
{
2018-12-13 10:48:25 +00:00
if(first_flag == 0)
{
first_pts = packet.pts;
first_flag = 1;
}
2018-07-13 01:31:50 +00:00
nPacketCount++;
if(CdxParserRead(p->mParser, &packet) == 0)
{
VideoStreamDataInfo dataInfo;
dataInfo.pData = (char*)packet.buf;
dataInfo.nLength = packet.length;
dataInfo.nPts = packet.pts;
dataInfo.nPcr = -1;
dataInfo.bIsFirstPart = 1;
dataInfo.bIsLastPart = 1;
dataInfo.nStreamIndex = 0;
SubmitVideoStreamData(p->mVideoDecoder, &dataInfo, 0);
}
else
{
//* read data fail, may be data error.
loge("read packet from parser fail.");
bDone = 1;
bSuccess = 0;
break;
}
}
else
{
//* no buffer, may be the decoder is full of stream.
logw("waiting for stream buffer.");
}
}
else
{
//* only process the major video stream.
//* allocate a buffer to read uncare media data and skip it.
packet.buf = malloc(packet.length);
if(packet.buf != NULL)
{
nPacketCount++;
packet.buflen = packet.length;
packet.ringBuf = NULL;
packet.ringBufLen = 0;
if(CdxParserRead(p->mParser, &packet) == 0)
{
free(packet.buf);
continue;
}
else
{
free(packet.buf);
//* read data fail, may be data error.
loge("read packet from parser fail.");
bDone = 1;
bSuccess = 0;
break;
}
}
else
{
loge("can not allocate buffer for none video packet.");
bDone = 1;
bSuccess = 0;
break;
}
}
//* 4.3 decode stream.
ret = DecodeVideoStream(p->mVideoDecoder, 0 /*eos*/,
0/*key frame only*/, 0/*drop b frame*/, 0/*current time*/);
if(ret < 0)
{
loge("decode stream return fail.");
bDone = 1;
bSuccess = 0;
break;
}
else if(ret == VDECODE_RESULT_RESOLUTION_CHANGE)
{
logi("video resolution changed.");
ReopenVideoEngine(p->mVideoDecoder, &vconfig,
&p->mMediaInfo.program[p->mMediaInfo.programIndex].video[0]);
continue;
}
//* 4.4 try to get a picture from the decoder.
if(ret == VDECODE_RESULT_FRAME_DECODED || ret == VDECODE_RESULT_KEYFRAME_DECODED)
{
pPicture = RequestPicture(p->mVideoDecoder, 0/*the major stream*/);
if(pPicture != NULL)
{
2018-12-13 10:48:25 +00:00
if(ret == VDECODE_RESULT_KEYFRAME_DECODED)
{
if(option == 3)
{
if(timeUs - pPicture->nPts < 16666)
{
bDone = 1;
bSuccess = 1;
break;
}
else
{
ReturnPicture(p->mVideoDecoder,pPicture);
pPicture = NULL;
}
}
else
{
if(option == 1)
{
if(pPicture->nPts >= timeUs)
{
bDone = 1;
bSuccess = 1;
break;
}
else
{
ReturnPicture(p->mVideoDecoder,pPicture);
pPicture = NULL;
}
}
if(option == 0 || option == 2)
{
bDone = 1;
bSuccess = 1;
break;
}
}
}
else
{
if(option == 3)
{
if(timeUs - pPicture->nPts < 16666)
{
bDone = 1;
bSuccess = 1;
break;
}
else
{
ReturnPicture(p->mVideoDecoder,pPicture);
pPicture = NULL;
}
}
else
{
ReturnPicture(p->mVideoDecoder,pPicture);
pPicture = NULL;
}
}
2018-07-13 01:31:50 +00:00
}
}
//* check whether cost too long time or process too much packets.
nTimePassed = GetSysTime() - nStartTime;
if(nTimePassed > MAX_TIME_TO_GET_A_FRAME || nTimePassed < 0)
{
logw("cost more than %d us but can not get a picture, quit.", MAX_TIME_TO_GET_A_FRAME);
bDone = 1;
bSuccess = 0;
break;
}
if(nPacketCount > MAX_PACKET_COUNT_TO_GET_A_FRAME)
{
logw("process more than %d packets but can not get a picture, quit.",
MAX_PACKET_COUNT_TO_GET_A_FRAME);
bDone = 1;
bSuccess = 0;
break;
}
}while(!bDone);
//* 5. transform the picture if suceess to get a picture.
if(bSuccess)
{
//* let the width and height is multiple of 2, for convinient of yuv to rgb565 converting.
if(pPicture->nLeftOffset & 1)
pPicture->nLeftOffset += 1;
if(pPicture->nRightOffset & 1)
pPicture->nRightOffset -= 1;
if(pPicture->nTopOffset & 1)
pPicture->nTopOffset += 1;
if(pPicture->nBottomOffset & 1)
pPicture->nBottomOffset -= 1;
//* I find that the mpeg2 decoder output the original picture's crop params,
//* it is bigger than the scaledown picture's size.
if((pPicture->nBottomOffset != 0 || pPicture->nRightOffset != 0) &&
pPicture->nRightOffset <= pPicture->nLineStride)
{
p->mVideoFrame.mDisplayWidth = pPicture->nRightOffset - pPicture->nLeftOffset;
p->mVideoFrame.mDisplayHeight = pPicture->nBottomOffset - pPicture->nTopOffset;
p->mVideoFrame.mWidth = p->mVideoFrame.mDisplayWidth;
p->mVideoFrame.mHeight = p->mVideoFrame.mDisplayHeight;
}
else
{
p->mVideoFrame.mDisplayWidth = pPicture->nWidth;
p->mVideoFrame.mDisplayHeight = pPicture->nHeight;
p->mVideoFrame.mWidth = pPicture->nWidth;
p->mVideoFrame.mHeight = pPicture->nHeight;
}
if(pPicture->ePixelFormat == PIXEL_FORMAT_YUV_MB32_420)
{
// for 1663, mb32
p->mVideoFrame.mDisplayWidth = pPicture->nWidth;
p->mVideoFrame.mDisplayHeight = pPicture->nHeight;
p->mVideoFrame.mWidth = pPicture->nWidth;
p->mVideoFrame.mHeight = pPicture->nHeight;
p->mVideoFrame.mSize = p->mVideoFrame.mWidth * p->mVideoFrame.mHeight * 2;
p->mVideoFrame.mData = (unsigned char*)malloc(p->mVideoFrame.mSize);
if(p->mVideoFrame.mData == NULL)
{
loge("can not allocate memory for video frame.");
return NULL;
}
}
else
{
//* for RGB565 pixel format.
p->mVideoFrame.mSize = p->mVideoFrame.mWidth * p->mVideoFrame.mHeight * 2;
p->mVideoFrame.mData = (unsigned char*)malloc(p->mVideoFrame.mSize);
if(p->mVideoFrame.mData == NULL)
{
loge("can not allocate memory for video frame.");
return NULL;
}
}
p->mVideoFrame.mRotationAngle = 0;
if(pPicture->ePixelFormat == PIXEL_FORMAT_YUV_MB32_420)
{
//* convert pixel format.
if(transformPictureMb32ToRGB(p->memops, pPicture, &p->mVideoFrame) < 0)
{
return NULL;
}
}
2018-12-13 10:48:25 +00:00
else if(pPicture->ePixelFormat == PIXEL_FORMAT_NV12
|| pPicture->ePixelFormat == PIXEL_FORMAT_NV21)
{
if(transformPictureNV21ToRGB565(p->memops, pPicture, &p->mVideoFrame) < 0)
{
return NULL;
}
}
2018-07-13 01:31:50 +00:00
else
{
if(transformPicture(p->memops, pPicture, &p->mVideoFrame) < 0)
{
return NULL;
}
}
2018-12-13 10:48:25 +00:00
ReturnPicture(p->mVideoDecoder,pPicture);
pPicture = NULL;
ResetVideoDecoder(p->mVideoDecoder);
2018-07-13 01:31:50 +00:00
return &p->mVideoFrame;
}
else
{
loge("cannot decode a picture.");
return NULL;
}
}
XVideoStream *XRetrieverGetStreamAtTime(XRetriever * v,int64_t timeUs)
{
VideoPicture* pPicture;
int bDone;
int bHasVideo;
int nHorizonScaleRatio;
int nVerticalScaleRatio;
enum EPIXELFORMAT ePixelFormat;
VConfig vconfig;
CdxPacketT packet;
int ret;
int64_t nStartTime;
int64_t nTimePassed;
//* for encoder
VencBaseConfig sBaseEncConfig;
VencInputBuffer sInputBuffer;
VencOutputBuffer sOutputBuffer;
VencHeaderData spsppsInfo;
VencH264Param h264Param;
VideoEncoder* pVideoEncoder = NULL;
int bEncoderInited = 0;
unsigned char* pOutBuf = NULL;
int bBitStreamLength = 0;
int bEncodeAllFrames = 0;
int bFrameCounter = 0;
int videoCodec;
XRetrieverContext* p;
int bErr = 0;
p = (XRetrieverContext*)v;
#if SAVE_BITSTREAM
fph264 = fopen(bitstreamPath, "wb");
#endif
//* FIXME:
//* if it is a media file with drm protection, we should not return an album art picture.
bDone = 0;
bHasVideo = 0;
memset(&vconfig, 0, sizeof(VConfig));
//* 1. check whether there is a video stream.
if(p->mMediaInfo.programIndex >= 0 &&
p->mMediaInfo.programNum >= p->mMediaInfo.programIndex)
{
if(p->mMediaInfo.program[p->mMediaInfo.programIndex].videoNum > 0)
bHasVideo = 1;
}
if(!bHasVideo)
{
logw("media file do not contain a video stream, getFrameAtTime() return fail.");
bErr = 1;
goto NEED_EXIT;
}
videoCodec =
p->mMediaInfo.program[p->mMediaInfo.programIndex].video[0].eCodecFormat;
if(videoCodec == VIDEO_CODEC_FORMAT_WMV1 ||
videoCodec == VIDEO_CODEC_FORMAT_WMV2 ||
videoCodec == VIDEO_CODEC_FORMAT_VP6 ||
videoCodec == VIDEO_CODEC_FORMAT_H265 ||
videoCodec == VIDEO_CODEC_FORMAT_VP9)
{
logw("Soft decoder thumb disable!");
bErr = 1;
goto NEED_EXIT;
}
//* 2. create a video encoder
pVideoEncoder = VideoEncCreate(VENC_CODEC_H264);
if(pVideoEncoder == NULL)
{
bErr = 1;
goto NEED_EXIT;
}
pOutBuf = (unsigned char*)malloc(MAX_OUTPUT_STREAM_SIZE);
if(pOutBuf == NULL)
{
bErr = 1;
goto NEED_EXIT;
}
//* 3. create a video decoder.
if(p->mVideoDecoder == NULL)
{
p->mVideoDecoder = CreateVideoDecoder();
//* use decoder to capture thumbnail, decoder use less memory in this mode.
vconfig.bThumbnailMode = 0;
//* all decoder support YUV_MB32_420 format.
vconfig.eOutputPixelFormat = PIXEL_FORMAT_NV21;
//* no need to decode two picture when decoding a thumbnail picture.
vconfig.bDisable3D = 1;
vconfig.nAlignStride = 16;//* set align stride to 16 as default
#if 1
//* set this flag when the parser can give this info, mov files recorded by
//* iphone or android phone conains this info.
//* set the rotation
int nRotateDegree;
int nRotation = atoi((const char*)p->mMediaInfo.rotate);
if(nRotation == 0)
nRotateDegree = 0;
else if(nRotation == 90)
nRotateDegree = 1;
else if(nRotation == 180)
nRotateDegree = 2;
else if(nRotation == 270)
nRotateDegree = 3;
else
nRotateDegree = 0;
if(nRotateDegree != 0)
{
vconfig.bRotationEn = 1;
vconfig.nRotateDegree = nRotateDegree;
}else
{
vconfig.bRotationEn = 0;
vconfig.nRotateDegree = 0;
}
#endif
/* set the picture scale down ratio, we generate a picture with pixel
* size less than 640x480.
*/
nHorizonScaleRatio = 0;
nVerticalScaleRatio = 0;
VideoStreamInfo *videoInfo =
p->mMediaInfo.program[p->mMediaInfo.programIndex].video;
setScaleRatio(&vconfig, videoInfo, &nHorizonScaleRatio, &nVerticalScaleRatio);
//* set to the same scale ratio.
if(nVerticalScaleRatio > nHorizonScaleRatio)
nHorizonScaleRatio = nVerticalScaleRatio;
else
nVerticalScaleRatio = nHorizonScaleRatio;
//* set scale ratio to vconfig.
if(nHorizonScaleRatio || nVerticalScaleRatio)
{
vconfig.bScaleDownEn = 1;
vconfig.nHorizonScaleDownRatio = nHorizonScaleRatio;
vconfig.nVerticalScaleDownRatio = nVerticalScaleRatio;
}
vconfig.memops = MemAdapterGetOpsS();
//* initialize the decoder.
vconfig.nDeInterlaceHoldingFrameBufferNum = 0;//*not use deinterlace
vconfig.nDisplayHoldingFrameBufferNum = 0;//*gpu and decoder not share buffer
vconfig.nRotateHoldingFrameBufferNum = GetConfigParamterInt("pic_4rotate_num", 0);
vconfig.nDecodeSmoothFrameBufferNum = GetConfigParamterInt("pic_4smooth_num", 3);
if(InitializeVideoDecoder(p->mVideoDecoder, videoInfo, &vconfig) != 0)
{
loge("initialize video decoder fail.");
bErr = 1;
goto NEED_EXIT;
}
}
//* 4. seek parser to the specific position.
if(p->mMediaInfo.bSeekable && timeUs != 0 && timeUs <
((int64_t)p->mMediaInfo.program[p->mMediaInfo.programIndex].duration*1000))
{
//* FIXME.
//* we should seek to a position according to the 'option' param.
//* option = 0 means seek to the sync frame privious to the timeUs.
//* option = 1 means seek to the sync frame next to the timeUs.
//* option = 2 means seek to the sync frame closest to the timeUs.
//* option = 3 means seek to the closest frame to the timeUs.
//* here we process all case as option = 0.
2018-12-13 10:48:25 +00:00
if(CdxParserSeekTo(p->mParser, timeUs, 0) != 0)
2018-07-13 01:31:50 +00:00
{
loge("can not seek media file to the specific time %" PRId64 " us.", timeUs);
bErr = 1;
goto NEED_EXIT;
}
}
else
{
logw("media file do not support seek operation, get frame from the begin.");
}
//* 5. loop to get bitstream.
nStartTime = GetSysTime();
do
{
while(VideoStreamFrameNum(p->mVideoDecoder, 0) < 4)
{
//* 5.1 prefetch packet type and packet data size.
if(CdxParserPrefetch(p->mParser, &packet) != 0)
{
//* prefetch fail, may be file end reached.
bDone = 1;
goto EOS_EXIT;
}
//* 5.2 feed data to the video decoder.
if(packet.type == CDX_MEDIA_VIDEO && (packet.flags&MINOR_STREAM)==0)
{
ret = RequestVideoStreamBuffer(p->mVideoDecoder,
packet.length,
(char**)&packet.buf,
&packet.buflen,
(char**)&packet.ringBuf,
&packet.ringBufLen,
0);
if(ret==0 && (packet.buflen+packet.ringBufLen)>=packet.length)
{
if(CdxParserRead(p->mParser, &packet) == 0)
{
VideoStreamDataInfo dataInfo;
dataInfo.pData = (char*)packet.buf;
dataInfo.nLength = packet.length;
dataInfo.nPts = packet.pts;
dataInfo.nPcr = -1;
dataInfo.bIsFirstPart = 1;
dataInfo.bIsLastPart = 1;
dataInfo.nStreamIndex = 0;
SubmitVideoStreamData(p->mVideoDecoder, &dataInfo, 0);
}
else
{
//* read data fail, may be data error.
loge("read packet from parser fail.");
bDone = 1;
goto EOS_EXIT;
}
}
else
{
//* no buffer, may be the decoder is full of stream.
logw("waiting for stream buffer.");
bDone = 1;
goto EOS_EXIT;
}
}
else
{
//* only process the major video stream.
//* allocate a buffer to read uncare media data and skip it.
packet.buf = malloc(packet.length);
if(packet.buf != NULL)
{
packet.buflen = packet.length;
packet.ringBuf = NULL;
packet.ringBufLen = 0;
if(CdxParserRead(p->mParser, &packet) == 0)
{
free(packet.buf);
continue;
}
else
{
free(packet.buf);
//* read data fail, may be data error.
loge("read packet from parser fail.");
bDone = 1;
goto EOS_EXIT;
}
}
else
{
loge("can not allocate buffer for none video packet.");
bDone = 1;
goto EOS_EXIT;
}
}
}
logv("stream number: %d", VideoStreamFrameNum(p->mVideoDecoder, 0));
//* 5.3 decode stream.
ret = DecodeVideoStream(p->mVideoDecoder, 0 /*eos*/, 0/*key frame only*/,
0/*drop b frame*/, 0/*current time*/);
if(ret < 0)
{
loge("decode stream return fail.");
bDone = 1;
break;
}
else if(ret == VDECODE_RESULT_RESOLUTION_CHANGE)
{
logi("video resolution changed.");
bDone = 1;
break;
}
//* 5.4 try to get a picture from the decoder and encode it.
if(ret == VDECODE_RESULT_FRAME_DECODED || ret == VDECODE_RESULT_KEYFRAME_DECODED)
{
pPicture = RequestPicture(p->mVideoDecoder, 0/*the major stream*/);
if(pPicture != NULL)
{
bFrameCounter++;
int enc_width = 0;
int enc_height = 0;
if(bEncoderInited == 0)
{
//* h264 param
memset(&h264Param, 0, sizeof(VencH264Param));
h264Param.bEntropyCodingCABAC = 1;
h264Param.nBitrate = 150000; /* bps */
h264Param.nCodingMode = VENC_FRAME_CODING;
h264Param.nMaxKeyInterval = 60;
h264Param.sProfileLevel.nProfile = VENC_H264ProfileMain;
h264Param.sProfileLevel.nLevel = VENC_H264Level31;
h264Param.sQPRange.nMinqp = 20;
h264Param.sQPRange.nMaxqp = 40;
VideoEncSetParameter(pVideoEncoder, VENC_IndexParamH264Param, &h264Param);
if(pPicture->nFrameRate > 20000)
{
h264Param.nFramerate = (pPicture->nFrameRate/1000)>>1;
bEncodeAllFrames = 0;
}
else if(pPicture->nFrameRate > 0)
{
h264Param.nFramerate = pPicture->nFrameRate/1000;
bEncodeAllFrames = 1;
}
else
{
h264Param.nFramerate = 15; /* fps */
bEncodeAllFrames = 0;
}
//* init encoder config info
memset(&sBaseEncConfig, 0 ,sizeof(VencBaseConfig));
if((pPicture->nBottomOffset != 0 || pPicture->nRightOffset != 0) &&
pPicture->nRightOffset <= pPicture->nLineStride)
{
enc_width = pPicture->nRightOffset - pPicture->nLeftOffset;
enc_height = pPicture->nBottomOffset - pPicture->nTopOffset;
}
else
{
enc_width = pPicture->nWidth;
enc_height = pPicture->nHeight;
}
sBaseEncConfig.nInputWidth= (pPicture->nWidth);
sBaseEncConfig.nInputHeight = (pPicture->nHeight);
sBaseEncConfig.nStride = pPicture->nLineStride;
sBaseEncConfig.nDstWidth = 256;
sBaseEncConfig.nDstHeight = 144;
sBaseEncConfig.eInputFormat = VENC_PIXEL_YVU420SP;
logd("w:%d, h:%d, stride:%d", sBaseEncConfig.nInputWidth,
sBaseEncConfig.nInputHeight, pPicture->nLineStride);
logd("nRightOffset:%d, nLeftOffset:%d, nBottomOffset:%d, nTopOffset:%d",
pPicture->nRightOffset, pPicture->nLeftOffset,
pPicture->nBottomOffset, pPicture->nTopOffset);
if(VideoEncInit(pVideoEncoder, &sBaseEncConfig)!=0)
{
loge("VideoEncInit failed");
bErr = 1;
goto NEED_EXIT;
}
VideoEncGetParameter(pVideoEncoder, VENC_IndexParamH264SPSPPS, &spsppsInfo);
if(spsppsInfo.pBuffer != 0 &&
(spsppsInfo.nLength + 8 <= MAX_OUTPUT_STREAM_SIZE))
{
int frameRate = h264Param.nFramerate*1000;
pOutBuf[bBitStreamLength++] = 't';
pOutBuf[bBitStreamLength++] = 'h';
pOutBuf[bBitStreamLength++] = 'u';
pOutBuf[bBitStreamLength++] = 'm';
pOutBuf[bBitStreamLength++] = frameRate & 0xff;
pOutBuf[bBitStreamLength++] = (frameRate>>8) & 0xff;
pOutBuf[bBitStreamLength++] = (frameRate>>16) & 0xff;
pOutBuf[bBitStreamLength++] = (frameRate>>24) & 0xff;
pOutBuf[bBitStreamLength++] = spsppsInfo.nLength & 0xff;
pOutBuf[bBitStreamLength++] = (spsppsInfo.nLength>>8) & 0xff;
pOutBuf[bBitStreamLength++] = (spsppsInfo.nLength>>16) & 0xff;
pOutBuf[bBitStreamLength++] = (spsppsInfo.nLength>>24) & 0xff;
memcpy(pOutBuf + bBitStreamLength, (unsigned char*)spsppsInfo.pBuffer,
(int)spsppsInfo.nLength);
bBitStreamLength += spsppsInfo.nLength;
#if SAVE_BITSTREAM
fwrite(spsppsInfo.pBuffer, 1, spsppsInfo.nLength, fph264);
#endif
}
else
{
loge("can not get sps and pps from encoder.");
bErr = 1;
goto NEED_EXIT;
}
bEncoderInited = 1;
}
if(bEncodeAllFrames || (bFrameCounter & 1))
{
if((pPicture->nBottomOffset != 0 || pPicture->nRightOffset != 0) &&
pPicture->nRightOffset <= pPicture->nLineStride)
{
enc_width = pPicture->nRightOffset - pPicture->nLeftOffset;
enc_height = pPicture->nBottomOffset - pPicture->nTopOffset;
}
else
{
enc_width = pPicture->nWidth;
enc_height = pPicture->nHeight;
}
memset(&sInputBuffer, 0, sizeof(VencInputBuffer));
sInputBuffer.pAddrPhyY =
(unsigned char*)CdcMemGetPhysicAddressCpu(p->memops,
pPicture->pData0);
sInputBuffer.pAddrPhyC =
(unsigned char*)CdcMemGetPhysicAddressCpu(p->memops,
pPicture->pData1);
if((enc_width <= pPicture->nWidth) || (enc_height <= pPicture->nHeight))
{
sInputBuffer.bEnableCorp = 1;
sInputBuffer.sCropInfo.nWidth = enc_width;
sInputBuffer.sCropInfo.nHeight= enc_height;
sInputBuffer.sCropInfo.nLeft = pPicture->nLeftOffset;
sInputBuffer.sCropInfo.nTop = pPicture->nTopOffset ;
}
AddOneInputBuffer(pVideoEncoder, &sInputBuffer);
ret = VideoEncodeOneFrame(pVideoEncoder);
if(ret != VENC_RESULT_OK)
{
loge("encoder error");
bErr = 1;
goto NEED_EXIT;
}
AlreadyUsedInputBuffer(pVideoEncoder,&sInputBuffer);
memset(&sOutputBuffer, 0, sizeof(VencOutputBuffer));
GetOneBitstreamFrame(pVideoEncoder, &sOutputBuffer);
if((sOutputBuffer.nSize0 + sOutputBuffer.nSize1 + 4) <= MAX_OUTPUT_STREAM_SIZE)
{
int frameSize = sOutputBuffer.nSize0 + sOutputBuffer.nSize1;
pOutBuf[bBitStreamLength++] = frameSize & 0xff;
pOutBuf[bBitStreamLength++] = (frameSize>>8) & 0xff;
pOutBuf[bBitStreamLength++] = (frameSize>>16) & 0xff;
pOutBuf[bBitStreamLength++] = (frameSize>>24) & 0xff;
memcpy(pOutBuf + bBitStreamLength, sOutputBuffer.pData0,
sOutputBuffer.nSize0);
bBitStreamLength += sOutputBuffer.nSize0;
if(sOutputBuffer.pData1 != NULL && sOutputBuffer.nSize1 > 0)
{
memcpy(pOutBuf + bBitStreamLength, sOutputBuffer.pData1,
sOutputBuffer.nSize1);
bBitStreamLength += sOutputBuffer.nSize1;
}
}
#if SAVE_BITSTREAM
fwrite(sOutputBuffer.pData0, 1, sOutputBuffer.nSize0, fph264);
if(sOutputBuffer.pData1 != NULL && sOutputBuffer.nSize1 > 0)
{
fwrite(sOutputBuffer.pData1, 1, sOutputBuffer.nSize1, fph264);
}
#endif
FreeOneBitStreamFrame(pVideoEncoder, &sOutputBuffer);
}
ReturnPicture(p->mVideoDecoder, pPicture);
}
}
//* check whether cost too long time or process too much packets.
nTimePassed = GetSysTime() - nStartTime;
if(nTimePassed > MAX_TIME_TO_GET_A_STREAM)
{
logw("cost more than %d us to get a steam, quit.", MAX_TIME_TO_GET_A_FRAME);
bDone = 1;
break;
}
if(bFrameCounter >= 150)
{
bDone = 1;
break;
}
}while(!bDone);
EOS_EXIT:
if (pOutBuf && bBitStreamLength)
{
p->mVideoStream.mBuf = pOutBuf;
p->mVideoStream.mSize = bBitStreamLength;
}
logv("bBitStreamLength: %p,%d", pOutBuf, bBitStreamLength);
NEED_EXIT:
if(pVideoEncoder)
{
VideoEncUnInit(pVideoEncoder);
VideoEncDestroy(pVideoEncoder);
pVideoEncoder = NULL;
}
if(pOutBuf)
{
free(pOutBuf);
pOutBuf = NULL;
}
if(p->mVideoDecoder)
{
DestroyVideoDecoder(p->mVideoDecoder);
p->mVideoDecoder = NULL;
}
#if SAVE_BITSTREAM
fclose(fph264);
fph264 = NULL;
#endif
if(bErr == 1)
return NULL;
else
return &p->mVideoStream;
}
int XRetrieverGetMetaData(XRetriever* v, int type, void* pVal)
{
XRetrieverContext* p;
p = (XRetrieverContext*)v;
switch(type)
{
case METADATA_VIDEO_WIDTH:
{
int *w = (int*)pVal;
logd("w: %d", p->mMediaInfo.program[0].video[0].nWidth);
*w = p->mMediaInfo.program[0].video[0].nWidth;
break;
}
case METADATA_VIDEO_HEIGHT:
{
int *h = (int*)pVal;
logd("h: %d", p->mMediaInfo.program[0].video[0].nHeight);
*h = p->mMediaInfo.program[0].video[0].nHeight;
break;
}
case METADATA_DURATION:
{
int *duration = (int*)pVal;
*duration = p->mMediaInfo.program[0].duration;
break;
}
case METADATA_MEDIAINFO:
{
CdxMediaInfoT *mi = (CdxMediaInfoT *)pVal;
*mi = p->mMediaInfo;
break;
}
case METADATA_PARSER_TYPE:
{
int *type = (int*)pVal;
*type = p->mParser->type;
break;
}
default:
{
logw("unknown type: %d", type);
return -1;
}
}
return 0;
}
static int64_t GetSysTime()
{
int64_t time;
struct timeval t;
gettimeofday(&t, NULL);
time = (int64_t)t.tv_sec * 1000000;
time += t.tv_usec;
return time;
}
static int transformPicture(struct ScMemOpsS *memOps,
VideoPicture * pPicture,
XVideoFrame* pVideoFrame)
{
unsigned short* pDst;
unsigned char* pSrcY;
unsigned char* pSrcU;
unsigned char* pSrcV;
int y;
int x;
unsigned char* pClipTable;
unsigned char* pClip;
static const int nClipMin = -278;
static const int nClipMax = 535;
if((pPicture->ePixelFormat!= PIXEL_FORMAT_YV12) &&
(pPicture->ePixelFormat!= PIXEL_FORMAT_YUV_PLANER_420))
{
loge("source pixel format is not YV12, quit.");
return -1;
}
//* initialize the clip table.
pClipTable = (unsigned char*)malloc(nClipMax - nClipMin + 1);
if(pClipTable == NULL)
{
loge("can not allocate memory for the clip table, quit.");
return -1;
}
for(x=nClipMin; x<=nClipMax; x++)
{
pClipTable[x-nClipMin] = (x<0) ? 0 : (x>255) ? 255 : x;
}
pClip = &pClipTable[-nClipMin];
//* flush cache.
CdcMemFlushCache(memOps, pPicture->pData0, pPicture->nLineStride*pPicture->nHeight);
CdcMemFlushCache(memOps, pPicture->pData1, pPicture->nLineStride*pPicture->nHeight/4);
CdcMemFlushCache(memOps, pPicture->pData2, pPicture->nLineStride*pPicture->nHeight/4);
//* set pointers.
pDst = (unsigned short*)pVideoFrame->mData;
pSrcY = (unsigned char*)pPicture->pData0 + pPicture->nTopOffset * \
pPicture->nLineStride + pPicture->nLeftOffset;
if(pPicture->ePixelFormat== PIXEL_FORMAT_YV12)
{
pSrcV = (unsigned char*)pPicture->pData1 + (pPicture->nTopOffset/2) * \
(pPicture->nLineStride/2) + pPicture->nLeftOffset/2;
pSrcU = (unsigned char*)pPicture->pData2 + (pPicture->nTopOffset/2) * \
(pPicture->nLineStride/2) + pPicture->nLeftOffset/2;
}
else
{
pSrcU = (unsigned char*)pPicture->pData1 + (pPicture->nTopOffset/2) * \
(pPicture->nLineStride/2) + pPicture->nLeftOffset/2;
pSrcV = (unsigned char*)pPicture->pData2 + (pPicture->nTopOffset/2) * \
(pPicture->nLineStride/2) + pPicture->nLeftOffset/2;
}
for(y = 0; y < (int)pVideoFrame->mHeight; ++y)
{
for(x = 0; x < (int)pVideoFrame->mWidth; x += 2)
{
// B = 1.164 * (Y - 16) + 2.018 * (U - 128)
// G = 1.164 * (Y - 16) - 0.813 * (V - 128) - 0.391 * (U - 128)
// R = 1.164 * (Y - 16) + 1.596 * (V - 128)
// B = 298/256 * (Y - 16) + 517/256 * (U - 128)
// G = .................. - 208/256 * (V - 128) - 100/256 * (U - 128)
// R = .................. + 409/256 * (V - 128)
// min_B = (298 * (- 16) + 517 * (- 128)) / 256 = -277
// min_G = (298 * (- 16) - 208 * (255 - 128) - 100 * (255 - 128)) / 256 = -172
// min_R = (298 * (- 16) + 409 * (- 128)) / 256 = -223
// max_B = (298 * (255 - 16) + 517 * (255 - 128)) / 256 = 534
// max_G = (298 * (255 - 16) - 208 * (- 128) - 100 * (- 128)) / 256 = 432
// max_R = (298 * (255 - 16) + 409 * (255 - 128)) / 256 = 481
// clip range -278 .. 535
signed y1 = (signed)pSrcY[x] - 16;
signed y2 = (signed)pSrcY[x + 1] - 16;
signed u = (signed)pSrcU[x / 2] - 128;
signed v = (signed)pSrcV[x / 2] - 128;
signed u_b = u * 517;
signed u_g = -u * 100;
signed v_g = -v * 208;
signed v_r = v * 409;
signed tmp1 = y1 * 298;
signed b1 = (tmp1 + u_b) / 256;
signed g1 = (tmp1 + v_g + u_g) / 256;
signed r1 = (tmp1 + v_r) / 256;
signed tmp2 = y2 * 298;
signed b2 = (tmp2 + u_b) / 256;
signed g2 = (tmp2 + v_g + u_g) / 256;
signed r2 = (tmp2 + v_r) / 256;
unsigned int rgb1 = ((pClip[r1] >> 3) << 11) |
((pClip[g1] >> 2) << 5) |
(pClip[b1] >> 3);
unsigned int rgb2 = ((pClip[r2] >> 3) << 11) |
((pClip[g2] >> 2) << 5) |
(pClip[b2] >> 3);
*(unsigned int *)(&pDst[x]) = (rgb2 << 16) | rgb1;
}
pSrcY += pPicture->nLineStride;
if(y & 1)
{
pSrcU += pPicture->nLineStride / 2;
pSrcV += pPicture->nLineStride / 2;
}
pDst += pVideoFrame->mWidth;
}
free(pClipTable);
return 0;
}