872 lines
29 KiB
C
872 lines
29 KiB
C
/*
|
|
* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*
|
|
* Based on code from the OggTheora software codec source code,
|
|
* Copyright (C) 2002-2010 The Xiph.Org Foundation and contributors.
|
|
*/
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include "y4minput.h"
|
|
|
|
static int y4m_parse_tags(y4m_input *_y4m,char *_tags){
|
|
int got_w;
|
|
int got_h;
|
|
int got_fps;
|
|
int got_interlace;
|
|
int got_par;
|
|
int got_chroma;
|
|
char *p;
|
|
char *q;
|
|
got_w=got_h=got_fps=got_interlace=got_par=got_chroma=0;
|
|
for(p=_tags;;p=q){
|
|
/*Skip any leading spaces.*/
|
|
while(*p==' ')p++;
|
|
/*If that's all we have, stop.*/
|
|
if(p[0]=='\0')break;
|
|
/*Find the end of this tag.*/
|
|
for(q=p+1;*q!='\0'&&*q!=' ';q++);
|
|
/*Process the tag.*/
|
|
switch(p[0]){
|
|
case 'W':{
|
|
if(sscanf(p+1,"%d",&_y4m->pic_w)!=1)return -1;
|
|
got_w=1;
|
|
}break;
|
|
case 'H':{
|
|
if(sscanf(p+1,"%d",&_y4m->pic_h)!=1)return -1;
|
|
got_h=1;
|
|
}break;
|
|
case 'F':{
|
|
if(sscanf(p+1,"%d:%d",&_y4m->fps_n,&_y4m->fps_d)!=2){
|
|
return -1;
|
|
}
|
|
got_fps=1;
|
|
}break;
|
|
case 'I':{
|
|
_y4m->interlace=p[1];
|
|
got_interlace=1;
|
|
}break;
|
|
case 'A':{
|
|
if(sscanf(p+1,"%d:%d",&_y4m->par_n,&_y4m->par_d)!=2){
|
|
return -1;
|
|
}
|
|
got_par=1;
|
|
}break;
|
|
case 'C':{
|
|
if(q-p>16)return -1;
|
|
memcpy(_y4m->chroma_type,p+1,q-p-1);
|
|
_y4m->chroma_type[q-p-1]='\0';
|
|
got_chroma=1;
|
|
}break;
|
|
/*Ignore unknown tags.*/
|
|
}
|
|
}
|
|
if(!got_w||!got_h||!got_fps)return -1;
|
|
if(!got_interlace)_y4m->interlace='?';
|
|
if(!got_par)_y4m->par_n=_y4m->par_d=0;
|
|
/*Chroma-type is not specified in older files, e.g., those generated by
|
|
mplayer.*/
|
|
if(!got_chroma)strcpy(_y4m->chroma_type,"420");
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
/*All anti-aliasing filters in the following conversion functions are based on
|
|
one of two window functions:
|
|
The 6-tap Lanczos window (for down-sampling and shifts):
|
|
sinc(\pi*t)*sinc(\pi*t/3), |t|<3 (sinc(t)==sin(t)/t)
|
|
0, |t|>=3
|
|
The 4-tap Mitchell window (for up-sampling):
|
|
7|t|^3-12|t|^2+16/3, |t|<1
|
|
-(7/3)|x|^3+12|x|^2-20|x|+32/3, |t|<2
|
|
0, |t|>=2
|
|
The number of taps is intentionally kept small to reduce computational
|
|
overhead and limit ringing.
|
|
|
|
The taps from these filters are scaled so that their sum is 1, and the result
|
|
is scaled by 128 and rounded to integers to create a filter whose
|
|
intermediate values fit inside 16 bits.
|
|
Coefficients are rounded in such a way as to ensure their sum is still 128,
|
|
which is usually equivalent to normal rounding.
|
|
|
|
Conversions which require both horizontal and vertical filtering could
|
|
have these steps pipelined, for less memory consumption and better cache
|
|
performance, but we do them separately for simplicity.*/
|
|
|
|
#define OC_MINI(_a,_b) ((_a)>(_b)?(_b):(_a))
|
|
#define OC_MAXI(_a,_b) ((_a)<(_b)?(_b):(_a))
|
|
#define OC_CLAMPI(_a,_b,_c) (OC_MAXI(_a,OC_MINI(_b,_c)))
|
|
|
|
/*420jpeg chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
420mpeg2 chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
BR | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
BR | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
We use a resampling filter to shift the site locations one quarter pixel (at
|
|
the chroma plane's resolution) to the right.
|
|
The 4:2:2 modes look exactly the same, except there are twice as many chroma
|
|
lines, and they are vertically co-sited with the luma samples in both the
|
|
mpeg2 and jpeg cases (thus requiring no vertical resampling).*/
|
|
static void y4m_42xmpeg2_42xjpeg_helper(unsigned char *_dst,
|
|
const unsigned char *_src,int _c_w,int _c_h){
|
|
int y;
|
|
int x;
|
|
for(y=0;y<_c_h;y++){
|
|
/*Filter: [4 -17 114 35 -9 1]/128, derived from a 6-tap Lanczos
|
|
window.*/
|
|
for(x=0;x<OC_MINI(_c_w,2);x++){
|
|
_dst[x]=(unsigned char)OC_CLAMPI(0,(4*_src[0]-17*_src[OC_MAXI(x-1,0)]+
|
|
114*_src[x]+35*_src[OC_MINI(x+1,_c_w-1)]-9*_src[OC_MINI(x+2,_c_w-1)]+
|
|
_src[OC_MINI(x+3,_c_w-1)]+64)>>7,255);
|
|
}
|
|
for(;x<_c_w-3;x++){
|
|
_dst[x]=(unsigned char)OC_CLAMPI(0,(4*_src[x-2]-17*_src[x-1]+
|
|
114*_src[x]+35*_src[x+1]-9*_src[x+2]+_src[x+3]+64)>>7,255);
|
|
}
|
|
for(;x<_c_w;x++){
|
|
_dst[x]=(unsigned char)OC_CLAMPI(0,(4*_src[x-2]-17*_src[x-1]+
|
|
114*_src[x]+35*_src[OC_MINI(x+1,_c_w-1)]-9*_src[OC_MINI(x+2,_c_w-1)]+
|
|
_src[_c_w-1]+64)>>7,255);
|
|
}
|
|
_dst+=_c_w;
|
|
_src+=_c_w;
|
|
}
|
|
}
|
|
|
|
/*Handles both 422 and 420mpeg2 to 422jpeg and 420jpeg, respectively.*/
|
|
static void y4m_convert_42xmpeg2_42xjpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int pli;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
for(pli=1;pli<3;pli++){
|
|
y4m_42xmpeg2_42xjpeg_helper(_dst,_aux,c_w,c_h);
|
|
_dst+=c_sz;
|
|
_aux+=c_sz;
|
|
}
|
|
}
|
|
|
|
/*This format is only used for interlaced content, but is included for
|
|
completeness.
|
|
|
|
420jpeg chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
420paldv chroma samples are sited like:
|
|
YR------Y-------YR------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YB------Y-------YB------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YR------Y-------YR------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YB------Y-------YB------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
We use a resampling filter to shift the site locations one quarter pixel (at
|
|
the chroma plane's resolution) to the right.
|
|
Then we use another filter to move the C_r location down one quarter pixel,
|
|
and the C_b location up one quarter pixel.*/
|
|
static void y4m_convert_42xpaldv_42xjpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
unsigned char *tmp;
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int pli;
|
|
int y;
|
|
int x;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+1)/2;
|
|
c_h=(_y4m->pic_h+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
c_sz=c_w*c_h;
|
|
tmp=_aux+2*c_sz;
|
|
for(pli=1;pli<3;pli++){
|
|
/*First do the horizontal re-sampling.
|
|
This is the same as the mpeg2 case, except that after the horizontal
|
|
case, we need to apply a second vertical filter.*/
|
|
y4m_42xmpeg2_42xjpeg_helper(tmp,_aux,c_w,c_h);
|
|
_aux+=c_sz;
|
|
switch(pli){
|
|
case 1:{
|
|
/*Slide C_b up a quarter-pel.
|
|
This is the same filter used above, but in the other order.*/
|
|
for(x=0;x<c_w;x++){
|
|
for(y=0;y<OC_MINI(c_h,3);y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(tmp[0]
|
|
-9*tmp[OC_MAXI(y-2,0)*c_w]+35*tmp[OC_MAXI(y-1,0)*c_w]
|
|
+114*tmp[y*c_w]-17*tmp[OC_MINI(y+1,c_h-1)*c_w]
|
|
+4*tmp[OC_MINI(y+2,c_h-1)*c_w]+64)>>7,255);
|
|
}
|
|
for(;y<c_h-2;y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(tmp[(y-3)*c_w]
|
|
-9*tmp[(y-2)*c_w]+35*tmp[(y-1)*c_w]+114*tmp[y*c_w]
|
|
-17*tmp[(y+1)*c_w]+4*tmp[(y+2)*c_w]+64)>>7,255);
|
|
}
|
|
for(;y<c_h;y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(tmp[(y-3)*c_w]
|
|
-9*tmp[(y-2)*c_w]+35*tmp[(y-1)*c_w]+114*tmp[y*c_w]
|
|
-17*tmp[OC_MINI(y+1,c_h-1)*c_w]+4*tmp[(c_h-1)*c_w]+64)>>7,255);
|
|
}
|
|
_dst++;
|
|
tmp++;
|
|
}
|
|
_dst+=c_sz-c_w;
|
|
tmp-=c_w;
|
|
}break;
|
|
case 2:{
|
|
/*Slide C_r down a quarter-pel.
|
|
This is the same as the horizontal filter.*/
|
|
for(x=0;x<c_w;x++){
|
|
for(y=0;y<OC_MINI(c_h,2);y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(4*tmp[0]
|
|
-17*tmp[OC_MAXI(y-1,0)*c_w]+114*tmp[y*c_w]
|
|
+35*tmp[OC_MINI(y+1,c_h-1)*c_w]-9*tmp[OC_MINI(y+2,c_h-1)*c_w]
|
|
+tmp[OC_MINI(y+3,c_h-1)*c_w]+64)>>7,255);
|
|
}
|
|
for(;y<c_h-3;y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(4*tmp[(y-2)*c_w]
|
|
-17*tmp[(y-1)*c_w]+114*tmp[y*c_w]+35*tmp[(y+1)*c_w]
|
|
-9*tmp[(y+2)*c_w]+tmp[(y+3)*c_w]+64)>>7,255);
|
|
}
|
|
for(;y<c_h;y++){
|
|
_dst[y*c_w]=(unsigned char)OC_CLAMPI(0,(4*tmp[(y-2)*c_w]
|
|
-17*tmp[(y-1)*c_w]+114*tmp[y*c_w]+35*tmp[OC_MINI(y+1,c_h-1)*c_w]
|
|
-9*tmp[OC_MINI(y+2,c_h-1)*c_w]+tmp[(c_h-1)*c_w]+64)>>7,255);
|
|
}
|
|
_dst++;
|
|
tmp++;
|
|
}
|
|
}break;
|
|
}
|
|
/*For actual interlaced material, this would have to be done separately on
|
|
each field, and the shift amounts would be different.
|
|
C_r moves down 1/8, C_b up 3/8 in the top field, and C_r moves down 3/8,
|
|
C_b up 1/8 in the bottom field.
|
|
The corresponding filters would be:
|
|
Down 1/8 (reverse order for up): [3 -11 125 15 -4 0]/128
|
|
Down 3/8 (reverse order for up): [4 -19 98 56 -13 2]/128*/
|
|
}
|
|
}
|
|
|
|
/*Perform vertical filtering to reduce a single plane from 4:2:2 to 4:2:0.
|
|
This is used as a helper by several converation routines.*/
|
|
static void y4m_422jpeg_420jpeg_helper(unsigned char *_dst,
|
|
const unsigned char *_src,int _c_w,int _c_h){
|
|
int y;
|
|
int x;
|
|
/*Filter: [3 -17 78 78 -17 3]/128, derived from a 6-tap Lanczos window.*/
|
|
for(x=0;x<_c_w;x++){
|
|
for(y=0;y<OC_MINI(_c_h,2);y+=2){
|
|
_dst[(y>>1)*_c_w]=OC_CLAMPI(0,(64*_src[0]
|
|
+78*_src[OC_MINI(1,_c_h-1)*_c_w]
|
|
-17*_src[OC_MINI(2,_c_h-1)*_c_w]
|
|
+3*_src[OC_MINI(3,_c_h-1)*_c_w]+64)>>7,255);
|
|
}
|
|
for(;y<_c_h-3;y+=2){
|
|
_dst[(y>>1)*_c_w]=OC_CLAMPI(0,(3*(_src[(y-2)*_c_w]+_src[(y+3)*_c_w])
|
|
-17*(_src[(y-1)*_c_w]+_src[(y+2)*_c_w])
|
|
+78*(_src[y*_c_w]+_src[(y+1)*_c_w])+64)>>7,255);
|
|
}
|
|
for(;y<_c_h;y+=2){
|
|
_dst[(y>>1)*_c_w]=OC_CLAMPI(0,(3*(_src[(y-2)*_c_w]
|
|
+_src[(_c_h-1)*_c_w])-17*(_src[(y-1)*_c_w]
|
|
+_src[OC_MINI(y+2,_c_h-1)*_c_w])
|
|
+78*(_src[y*_c_w]+_src[OC_MINI(y+1,_c_h-1)*_c_w])+64)>>7,255);
|
|
}
|
|
_src++;
|
|
_dst++;
|
|
}
|
|
}
|
|
|
|
/*420jpeg chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
422jpeg chroma samples are sited like:
|
|
Y---BR--Y-------Y---BR--Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y---BR--Y-------Y---BR--Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y---BR--Y-------Y---BR--Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y---BR--Y-------Y---BR--Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
We use a resampling filter to decimate the chroma planes by two in the
|
|
vertical direction.*/
|
|
static void y4m_convert_422jpeg_420jpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int dst_c_w;
|
|
int dst_c_h;
|
|
int dst_c_sz;
|
|
int pli;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+_y4m->src_c_dec_h-1)/_y4m->src_c_dec_h;
|
|
c_h=_y4m->pic_h;
|
|
dst_c_w=(_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
dst_c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
dst_c_sz=dst_c_w*dst_c_h;
|
|
for(pli=1;pli<3;pli++){
|
|
y4m_422jpeg_420jpeg_helper(_dst,_aux,c_w,c_h);
|
|
_aux+=c_sz;
|
|
_dst+=dst_c_sz;
|
|
}
|
|
}
|
|
|
|
/*420jpeg chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
422 chroma samples are sited like:
|
|
YBR-----Y-------YBR-----Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------YBR-----Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------YBR-----Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------YBR-----Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
We use a resampling filter to shift the original site locations one quarter
|
|
pixel (at the original chroma resolution) to the right.
|
|
Then we use a second resampling filter to decimate the chroma planes by two
|
|
in the vertical direction.*/
|
|
static void y4m_convert_422_420jpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
unsigned char *tmp;
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int dst_c_h;
|
|
int dst_c_sz;
|
|
int pli;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+_y4m->src_c_dec_h-1)/_y4m->src_c_dec_h;
|
|
c_h=_y4m->pic_h;
|
|
dst_c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
dst_c_sz=c_w*dst_c_h;
|
|
tmp=_aux+2*c_sz;
|
|
for(pli=1;pli<3;pli++){
|
|
/*In reality, the horizontal and vertical steps could be pipelined, for
|
|
less memory consumption and better cache performance, but we do them
|
|
separately for simplicity.*/
|
|
/*First do horizontal filtering (convert to 422jpeg)*/
|
|
y4m_42xmpeg2_42xjpeg_helper(tmp,_aux,c_w,c_h);
|
|
/*Now do the vertical filtering.*/
|
|
y4m_422jpeg_420jpeg_helper(_dst,tmp,c_w,c_h);
|
|
_aux+=c_sz;
|
|
_dst+=dst_c_sz;
|
|
}
|
|
}
|
|
|
|
/*420jpeg chroma samples are sited like:
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| BR | | BR |
|
|
| | | |
|
|
Y-------Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
411 chroma samples are sited like:
|
|
YBR-----Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
YBR-----Y-------Y-------Y-------
|
|
| | | |
|
|
| | | |
|
|
| | | |
|
|
|
|
We use a filter to resample at site locations one eighth pixel (at the source
|
|
chroma plane's horizontal resolution) and five eighths of a pixel to the
|
|
right.
|
|
Then we use another filter to decimate the planes by 2 in the vertical
|
|
direction.*/
|
|
static void y4m_convert_411_420jpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
unsigned char *tmp;
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int dst_c_w;
|
|
int dst_c_h;
|
|
int dst_c_sz;
|
|
int tmp_sz;
|
|
int pli;
|
|
int y;
|
|
int x;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+_y4m->src_c_dec_h-1)/_y4m->src_c_dec_h;
|
|
c_h=_y4m->pic_h;
|
|
dst_c_w=(_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
dst_c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
dst_c_sz=dst_c_w*dst_c_h;
|
|
tmp_sz=dst_c_w*c_h;
|
|
tmp=_aux+2*c_sz;
|
|
for(pli=1;pli<3;pli++){
|
|
/*In reality, the horizontal and vertical steps could be pipelined, for
|
|
less memory consumption and better cache performance, but we do them
|
|
separately for simplicity.*/
|
|
/*First do horizontal filtering (convert to 422jpeg)*/
|
|
for(y=0;y<c_h;y++){
|
|
/*Filters: [1 110 18 -1]/128 and [-3 50 86 -5]/128, both derived from a
|
|
4-tap Mitchell window.*/
|
|
for(x=0;x<OC_MINI(c_w,1);x++){
|
|
tmp[x<<1]=(unsigned char)OC_CLAMPI(0,(111*_aux[0]
|
|
+18*_aux[OC_MINI(1,c_w-1)]-_aux[OC_MINI(2,c_w-1)]+64)>>7,255);
|
|
tmp[x<<1|1]=(unsigned char)OC_CLAMPI(0,(47*_aux[0]
|
|
+86*_aux[OC_MINI(1,c_w-1)]-5*_aux[OC_MINI(2,c_w-1)]+64)>>7,255);
|
|
}
|
|
for(;x<c_w-2;x++){
|
|
tmp[x<<1]=(unsigned char)OC_CLAMPI(0,(_aux[x-1]+110*_aux[x]
|
|
+18*_aux[x+1]-_aux[x+2]+64)>>7,255);
|
|
tmp[x<<1|1]=(unsigned char)OC_CLAMPI(0,(-3*_aux[x-1]+50*_aux[x]
|
|
+86*_aux[x+1]-5*_aux[x+2]+64)>>7,255);
|
|
}
|
|
for(;x<c_w;x++){
|
|
tmp[x<<1]=(unsigned char)OC_CLAMPI(0,(_aux[x-1]+110*_aux[x]
|
|
+18*_aux[OC_MINI(x+1,c_w-1)]-_aux[c_w-1]+64)>>7,255);
|
|
if((x<<1|1)<dst_c_w){
|
|
tmp[x<<1|1]=(unsigned char)OC_CLAMPI(0,(-3*_aux[x-1]+50*_aux[x]
|
|
+86*_aux[OC_MINI(x+1,c_w-1)]-5*_aux[c_w-1]+64)>>7,255);
|
|
}
|
|
}
|
|
tmp+=dst_c_w;
|
|
_aux+=c_w;
|
|
}
|
|
tmp-=tmp_sz;
|
|
/*Now do the vertical filtering.*/
|
|
y4m_422jpeg_420jpeg_helper(_dst,tmp,dst_c_w,c_h);
|
|
_dst+=dst_c_sz;
|
|
}
|
|
}
|
|
|
|
/*Convert 444 to 420jpeg.*/
|
|
static void y4m_convert_444_420jpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
unsigned char *tmp;
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int dst_c_w;
|
|
int dst_c_h;
|
|
int dst_c_sz;
|
|
int tmp_sz;
|
|
int pli;
|
|
int y;
|
|
int x;
|
|
/*Skip past the luma data.*/
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
/*Compute the size of each chroma plane.*/
|
|
c_w=(_y4m->pic_w+_y4m->src_c_dec_h-1)/_y4m->src_c_dec_h;
|
|
c_h=_y4m->pic_h;
|
|
dst_c_w=(_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
dst_c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
dst_c_sz=dst_c_w*dst_c_h;
|
|
tmp_sz=dst_c_w*c_h;
|
|
tmp=_aux+2*c_sz;
|
|
for(pli=1;pli<3;pli++){
|
|
/*Filter: [3 -17 78 78 -17 3]/128, derived from a 6-tap Lanczos window.*/
|
|
for(y=0;y<c_h;y++){
|
|
for(x=0;x<OC_MINI(c_w,2);x+=2){
|
|
tmp[x>>1]=OC_CLAMPI(0,(64*_aux[0]+78*_aux[OC_MINI(1,c_w-1)]
|
|
-17*_aux[OC_MINI(2,c_w-1)]
|
|
+3*_aux[OC_MINI(3,c_w-1)]+64)>>7,255);
|
|
}
|
|
for(;x<c_w-3;x+=2){
|
|
tmp[x>>1]=OC_CLAMPI(0,(3*(_aux[x-2]+_aux[x+3])
|
|
-17*(_aux[x-1]+_aux[x+2])+78*(_aux[x]+_aux[x+1])+64)>>7,255);
|
|
}
|
|
for(;x<c_w;x+=2){
|
|
tmp[x>>1]=OC_CLAMPI(0,(3*(_aux[x-2]+_aux[c_w-1])-
|
|
17*(_aux[x-1]+_aux[OC_MINI(x+2,c_w-1)])+
|
|
78*(_aux[x]+_aux[OC_MINI(x+1,c_w-1)])+64)>>7,255);
|
|
}
|
|
tmp+=dst_c_w;
|
|
_aux+=c_w;
|
|
}
|
|
tmp-=tmp_sz;
|
|
/*Now do the vertical filtering.*/
|
|
y4m_422jpeg_420jpeg_helper(_dst,tmp,dst_c_w,c_h);
|
|
_dst+=dst_c_sz;
|
|
}
|
|
}
|
|
|
|
/*The image is padded with empty chroma components at 4:2:0.*/
|
|
static void y4m_convert_mono_420jpeg(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
int c_sz;
|
|
_dst+=_y4m->pic_w*_y4m->pic_h;
|
|
c_sz=((_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h)*
|
|
((_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v);
|
|
memset(_dst,128,c_sz*2);
|
|
}
|
|
|
|
/*No conversion function needed.*/
|
|
static void y4m_convert_null(y4m_input *_y4m,unsigned char *_dst,
|
|
unsigned char *_aux){
|
|
}
|
|
|
|
int y4m_input_open(y4m_input *_y4m,FILE *_fin,char *_skip,int _nskip){
|
|
char buffer[80];
|
|
int ret;
|
|
int i;
|
|
/*Read until newline, or 80 cols, whichever happens first.*/
|
|
for(i=0;i<79;i++){
|
|
if(_nskip>0){
|
|
buffer[i]=*_skip++;
|
|
_nskip--;
|
|
}
|
|
else{
|
|
ret=fread(buffer+i,1,1,_fin);
|
|
if(ret<1)return -1;
|
|
}
|
|
if(buffer[i]=='\n')break;
|
|
}
|
|
/*We skipped too much header data.*/
|
|
if(_nskip>0)return -1;
|
|
if(i==79){
|
|
fprintf(stderr,"Error parsing header; not a YUV2MPEG2 file?\n");
|
|
return -1;
|
|
}
|
|
buffer[i]='\0';
|
|
if(memcmp(buffer,"YUV4MPEG",8)){
|
|
fprintf(stderr,"Incomplete magic for YUV4MPEG file.\n");
|
|
return -1;
|
|
}
|
|
if(buffer[8]!='2'){
|
|
fprintf(stderr,"Incorrect YUV input file version; YUV4MPEG2 required.\n");
|
|
}
|
|
ret=y4m_parse_tags(_y4m,buffer+5);
|
|
if(ret<0){
|
|
fprintf(stderr,"Error parsing YUV4MPEG2 header.\n");
|
|
return ret;
|
|
}
|
|
if(_y4m->interlace=='?'){
|
|
fprintf(stderr,"Warning: Input video interlacing format unknown; "
|
|
"assuming progressive scan.\n");
|
|
}
|
|
else if(_y4m->interlace!='p'){
|
|
fprintf(stderr,"Input video is interlaced; "
|
|
"Only progressive scan handled.\n");
|
|
return -1;
|
|
}
|
|
if(strcmp(_y4m->chroma_type,"420")==0||
|
|
strcmp(_y4m->chroma_type,"420jpeg")==0){
|
|
_y4m->src_c_dec_h=_y4m->dst_c_dec_h=_y4m->src_c_dec_v=_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h
|
|
+2*((_y4m->pic_w+1)/2)*((_y4m->pic_h+1)/2);
|
|
/*Natively supported: no conversion required.*/
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz=0;
|
|
_y4m->convert=y4m_convert_null;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"420mpeg2")==0){
|
|
_y4m->src_c_dec_h=_y4m->dst_c_dec_h=_y4m->src_c_dec_v=_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.*/
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz=
|
|
2*((_y4m->pic_w+1)/2)*((_y4m->pic_h+1)/2);
|
|
_y4m->convert=y4m_convert_42xmpeg2_42xjpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"420paldv")==0){
|
|
_y4m->src_c_dec_h=_y4m->dst_c_dec_h=_y4m->src_c_dec_v=_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.
|
|
We need to make two filter passes, so we need some extra space in the
|
|
aux buffer.*/
|
|
_y4m->aux_buf_sz=3*((_y4m->pic_w+1)/2)*((_y4m->pic_h+1)/2);
|
|
_y4m->aux_buf_read_sz=2*((_y4m->pic_w+1)/2)*((_y4m->pic_h+1)/2);
|
|
_y4m->convert=y4m_convert_42xpaldv_42xjpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"422jpeg")==0){
|
|
_y4m->src_c_dec_h=_y4m->dst_c_dec_h=2;
|
|
_y4m->src_c_dec_v=1;
|
|
_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.*/
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz=2*((_y4m->pic_w+1)/2)*_y4m->pic_h;
|
|
_y4m->convert=y4m_convert_422jpeg_420jpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"422")==0){
|
|
_y4m->src_c_dec_h=_y4m->dst_c_dec_h=2;
|
|
_y4m->src_c_dec_v=1;
|
|
_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.
|
|
We need to make two filter passes, so we need some extra space in the
|
|
aux buffer.*/
|
|
_y4m->aux_buf_read_sz=2*((_y4m->pic_w+1)/2)*_y4m->pic_h;
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz+((_y4m->pic_w+1)/2)*_y4m->pic_h;
|
|
_y4m->convert=y4m_convert_422_420jpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"411")==0){
|
|
_y4m->src_c_dec_h=4;
|
|
_y4m->dst_c_dec_h=2;
|
|
_y4m->src_c_dec_v=1;
|
|
_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.
|
|
We need to make two filter passes, so we need some extra space in the
|
|
aux buffer.*/
|
|
_y4m->aux_buf_read_sz=2*((_y4m->pic_w+3)/4)*_y4m->pic_h;
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz+((_y4m->pic_w+1)/2)*_y4m->pic_h;
|
|
_y4m->convert=y4m_convert_411_420jpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"444")==0){
|
|
_y4m->src_c_dec_h=1;
|
|
_y4m->dst_c_dec_h=2;
|
|
_y4m->src_c_dec_v=1;
|
|
_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.
|
|
We need to make two filter passes, so we need some extra space in the
|
|
aux buffer.*/
|
|
_y4m->aux_buf_read_sz=2*_y4m->pic_w*_y4m->pic_h;
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz+((_y4m->pic_w+1)/2)*_y4m->pic_h;
|
|
_y4m->convert=y4m_convert_444_420jpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"444alpha")==0){
|
|
_y4m->src_c_dec_h=1;
|
|
_y4m->dst_c_dec_h=2;
|
|
_y4m->src_c_dec_v=1;
|
|
_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*Chroma filter required: read into the aux buf first.
|
|
We need to make two filter passes, so we need some extra space in the
|
|
aux buffer.
|
|
The extra plane also gets read into the aux buf.
|
|
It will be discarded.*/
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz=3*_y4m->pic_w*_y4m->pic_h;
|
|
_y4m->convert=y4m_convert_444_420jpeg;
|
|
}
|
|
else if(strcmp(_y4m->chroma_type,"mono")==0){
|
|
_y4m->src_c_dec_h=_y4m->src_c_dec_v=0;
|
|
_y4m->dst_c_dec_h=_y4m->dst_c_dec_v=2;
|
|
_y4m->dst_buf_read_sz=_y4m->pic_w*_y4m->pic_h;
|
|
/*No extra space required, but we need to clear the chroma planes.*/
|
|
_y4m->aux_buf_sz=_y4m->aux_buf_read_sz=0;
|
|
_y4m->convert=y4m_convert_mono_420jpeg;
|
|
}
|
|
else{
|
|
fprintf(stderr,"Unknown chroma sampling type: %s\n",_y4m->chroma_type);
|
|
return -1;
|
|
}
|
|
/*The size of the final frame buffers is always computed from the
|
|
destination chroma decimation type.*/
|
|
_y4m->dst_buf_sz=_y4m->pic_w*_y4m->pic_h
|
|
+2*((_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h)*
|
|
((_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v);
|
|
_y4m->dst_buf=(unsigned char *)malloc(_y4m->dst_buf_sz);
|
|
_y4m->aux_buf=(unsigned char *)malloc(_y4m->aux_buf_sz);
|
|
return 0;
|
|
}
|
|
|
|
void y4m_input_close(y4m_input *_y4m){
|
|
free(_y4m->dst_buf);
|
|
free(_y4m->aux_buf);
|
|
}
|
|
|
|
int y4m_input_fetch_frame(y4m_input *_y4m,FILE *_fin,vpx_image_t *_img){
|
|
char frame[6];
|
|
int pic_sz;
|
|
int c_w;
|
|
int c_h;
|
|
int c_sz;
|
|
int ret;
|
|
/*Read and skip the frame header.*/
|
|
ret=fread(frame,1,6,_fin);
|
|
if(ret<6)return 0;
|
|
if(memcmp(frame,"FRAME",5)){
|
|
fprintf(stderr,"Loss of framing in Y4M input data\n");
|
|
return -1;
|
|
}
|
|
if(frame[5]!='\n'){
|
|
char c;
|
|
int j;
|
|
for(j=0;j<79&&fread(&c,1,1,_fin)&&c!='\n';j++);
|
|
if(j==79){
|
|
fprintf(stderr,"Error parsing Y4M frame header\n");
|
|
return -1;
|
|
}
|
|
}
|
|
/*Read the frame data that needs no conversion.*/
|
|
if(fread(_y4m->dst_buf,1,_y4m->dst_buf_read_sz,_fin)!=_y4m->dst_buf_read_sz){
|
|
fprintf(stderr,"Error reading Y4M frame data.\n");
|
|
return -1;
|
|
}
|
|
/*Read the frame data that does need conversion.*/
|
|
if(fread(_y4m->aux_buf,1,_y4m->aux_buf_read_sz,_fin)!=_y4m->aux_buf_read_sz){
|
|
fprintf(stderr,"Error reading Y4M frame data.\n");
|
|
return -1;
|
|
}
|
|
/*Now convert the just read frame.*/
|
|
(*_y4m->convert)(_y4m,_y4m->dst_buf,_y4m->aux_buf);
|
|
/*Fill in the frame buffer pointers.
|
|
We don't use vpx_img_wrap() because it forces padding for odd picture
|
|
sizes, which would require a separate fread call for every row.*/
|
|
memset(_img,0,sizeof(*_img));
|
|
/*Y4M has the planes in Y'CbCr order, which libvpx calls Y, U, and V.*/
|
|
_img->fmt=IMG_FMT_I420;
|
|
_img->w=_img->d_w=_y4m->pic_w;
|
|
_img->h=_img->d_h=_y4m->pic_h;
|
|
/*This is hard-coded to 4:2:0 for now, as that's all VP8 supports.*/
|
|
_img->x_chroma_shift=1;
|
|
_img->y_chroma_shift=1;
|
|
_img->bps=12;
|
|
/*Set up the buffer pointers.*/
|
|
pic_sz=_y4m->pic_w*_y4m->pic_h;
|
|
c_w=(_y4m->pic_w+_y4m->dst_c_dec_h-1)/_y4m->dst_c_dec_h;
|
|
c_h=(_y4m->pic_h+_y4m->dst_c_dec_v-1)/_y4m->dst_c_dec_v;
|
|
c_sz=c_w*c_h;
|
|
_img->stride[PLANE_Y]=_y4m->pic_w;
|
|
_img->stride[PLANE_U]=_img->stride[PLANE_V]=c_w;
|
|
_img->planes[PLANE_Y]=_y4m->dst_buf;
|
|
_img->planes[PLANE_U]=_y4m->dst_buf+pic_sz;
|
|
_img->planes[PLANE_V]=_y4m->dst_buf+pic_sz+c_sz;
|
|
return 1;
|
|
}
|