~ubuntu-dev/mplayer/ubuntu-feisty

/**
 * Stores the colorspace parameters in the context and recomputes the
 * YUV->RGB coefficients that are derived from them.
 *
 * @param c          context to update
 * @param inv_table  4 coefficients; copied to c->srcColorspaceTable and used
 *                   as the source of the chroma coefficients
 * @param srcRange   0: luma is rescaled by 255/219 and gets an offset of 16;
 *                   non-zero: luma gain and offset are left alone
 * @param table      4 coefficients; only copied to c->dstColorspaceTable here
 * @param dstRange   only stored in the context here
 * @param brightness subtracted (times 256) from the luma offset
 * @param contrast   gain, applied with a >>16 (sws_getContext passes 1<<16)
 * @param saturation chroma gain, applied with a >>16 (sws_getContext passes 1<<16)
 * @return 0 on success, -1 if the destination format is YUV or gray
 */
int sws_setColorspaceDetails(SwsContext *c, const int inv_table[4], int srcRange, const int table[4], int dstRange, int brightness, int contrast, int saturation){
	int64_t vToR =  inv_table[0];
	int64_t uToB =  inv_table[1];
	int64_t uToG = -inv_table[2];
	int64_t vToG = -inv_table[3];
	int64_t lumaGain  = 1<<16;
	int64_t lumaOffset= 0;

	if(isYUV(c->dstFormat) || isGray(c->dstFormat))
		return -1;

	/* remember everything that sws_getColorspaceDetails() hands back later */
	c->srcRange  = srcRange;
	c->dstRange  = dstRange;
	c->brightness= brightness;
	c->contrast  = contrast;
	c->saturation= saturation;
	memcpy(c->srcColorspaceTable, inv_table, sizeof(int)*4);
	memcpy(c->dstColorspaceTable, table    , sizeof(int)*4);

	c->uOffset= 0x0400040004000400LL;
	c->vOffset= 0x0400040004000400LL;

	if(!srcRange){
		lumaGain  = (lumaGain*255) / 219;
		lumaOffset= 16<<16;
	}

	/* luma only sees the contrast, chroma sees contrast and saturation */
	lumaGain= (lumaGain*contrast)>>16;
	vToR= (vToR*contrast * saturation)>>32;
	uToB= (uToB*contrast * saturation)>>32;
	uToG= (uToG*contrast * saturation)>>32;
	vToG= (vToG*contrast * saturation)>>32;

	lumaOffset -= 256*brightness;

	/* every coefficient is replicated into the four 16 bit lanes of a 64 bit word */
	c->yCoeff = roundToInt16(lumaGain*8192) * 0x0001000100010001ULL;
	c->vrCoeff= roundToInt16(vToR*8192) * 0x0001000100010001ULL;
	c->ubCoeff= roundToInt16(uToB*8192) * 0x0001000100010001ULL;
	c->vgCoeff= roundToInt16(vToG*8192) * 0x0001000100010001ULL;
	c->ugCoeff= roundToInt16(uToG*8192) * 0x0001000100010001ULL;
	c->yOffset= roundToInt16(lumaOffset * 8) * 0x0001000100010001ULL;

	yuv2rgb_c_init_tables(c, inv_table, srcRange, brightness, contrast, saturation);
	//FIXME factorize

#ifdef COMPILE_ALTIVEC
	if (c->flags & SWS_CPU_CAPS_ALTIVEC)
		yuv2rgb_altivec_init_tables (c, inv_table, brightness, contrast, saturation);
#endif
	return 0;
}

1806

1807

/**

1808

* @return -1 if not supported

1809

1810

int sws_getColorspaceDetails(SwsContext *c, int **inv_table, int *srcRange, int **table, int *dstRange, int *brightness, int *contrast, int *saturation){

1811

if(isYUV(c->dstFormat) || isGray(c->dstFormat)) return -1;

1812

1813

*inv_table = c->srcColorspaceTable;

1814

*table = c->dstColorspaceTable;

1815

*srcRange = c->srcRange;

1816

*dstRange = c->dstRange;

1817

*brightness= c->brightness;

1818

*contrast = c->contrast;

1819

*saturation= c->saturation;

1820

1821

return 0;

1822

}

1823

1824

/**
 * Allocates and initializes a scaler context.
 *
 * @param srcW,srcH      source size; srcW must be >= 4 and srcH >= 1
 * @param origSrcFormat  source pixel format as given by the caller
 * @param dstW,dstH      destination size; dstW must be >= 8 and dstH >= 1
 * @param origDstFormat  destination pixel format as given by the caller
 * @param flags          scaler selection, SWS_CPU_CAPS_* and SWS_PRINT_INFO bits
 * @param srcFilter      optional source filter, NULL for none
 * @param dstFilter      optional destination filter, NULL for none
 * @param param          optional array of two scaler parameters, NULL selects
 *                       SWS_PARAM_DEFAULT for both
 * @return the new context (release it with sws_freeContext()), or NULL if a
 *         format is unsupported, the dimensions are invalid, or the context /
 *         the MMX2 helper buffers could not be allocated
 */
SwsContext *sws_getContext(int srcW, int srcH, int origSrcFormat, int dstW, int dstH, int origDstFormat, int flags,
                         SwsFilter *srcFilter, SwsFilter *dstFilter, double *param){

	SwsContext *c;
	int i;
	int usesVFilter, usesHFilter;
	int unscaled, needsDither;
	int srcFormat, dstFormat;
	SwsFilter dummyFilter= {NULL, NULL, NULL, NULL};
#if defined(ARCH_X86) || defined(ARCH_X86_64)
	if(flags & SWS_CPU_CAPS_MMX)
		asm volatile("emms\n\t"::: "memory");
#endif

#ifndef RUNTIME_CPUDETECT //ensure that the flags match the compiled variant if cpudetect is off
	flags &= ~(SWS_CPU_CAPS_MMX|SWS_CPU_CAPS_MMX2|SWS_CPU_CAPS_3DNOW|SWS_CPU_CAPS_ALTIVEC);
#ifdef HAVE_MMX2
	flags |= SWS_CPU_CAPS_MMX|SWS_CPU_CAPS_MMX2;
#elif defined (HAVE_3DNOW)
	flags |= SWS_CPU_CAPS_MMX|SWS_CPU_CAPS_3DNOW;
#elif defined (HAVE_MMX)
	flags |= SWS_CPU_CAPS_MMX;
#elif defined (HAVE_ALTIVEC)
	flags |= SWS_CPU_CAPS_ALTIVEC;
#endif
#endif
	/* one-time global initialisation, detected through the tables it fills */
	if(clip_table[512] != 255) globalInit();
	if(rgb15to16 == NULL) sws_rgb2rgb_init(flags);

	/* avoid duplicate formats, so we don't need to check too much */
	srcFormat = remove_dup_fourcc(origSrcFormat);
	dstFormat = remove_dup_fourcc(origDstFormat);

	unscaled = (srcW == dstW && srcH == dstH);
	needsDither= (isBGR(dstFormat) || isRGB(dstFormat))
		     && (dstFormat&0xFF)<24
		     && ((dstFormat&0xFF)<(srcFormat&0xFF) || (!(isRGB(srcFormat) || isBGR(srcFormat))));

	if(!isSupportedIn(srcFormat))
	{
		MSG_ERR("swScaler: %s is not supported as input format\n", vo_format_name(srcFormat));
		return NULL;
	}
	if(!isSupportedOut(dstFormat))
	{
		MSG_ERR("swScaler: %s is not supported as output format\n", vo_format_name(dstFormat));
		return NULL;
	}

	/* sanity check */
	if(srcW<4 || srcH<1 || dstW<8 || dstH<1) //FIXME check if these are enough and try to lower them after fixing the relevant parts of the code
	{
		MSG_ERR("swScaler: %dx%d -> %dx%d is invalid scaling dimension\n",
			srcW, srcH, dstW, dstH);
		return NULL;
	}

	if(!dstFilter) dstFilter= &dummyFilter;
	if(!srcFilter) srcFilter= &dummyFilter;

	c= memalign(64, sizeof(SwsContext));
	if(!c)
	{
		/* the memset below would otherwise write through a NULL pointer */
		MSG_ERR("swScaler: could not allocate the scaler context\n");
		return NULL;
	}
	memset(c, 0, sizeof(SwsContext));

	c->srcW= srcW;
	c->srcH= srcH;
	c->dstW= dstW;
	c->dstH= dstH;
	c->lumXInc= ((srcW<<16) + (dstW>>1))/dstW;
	c->lumYInc= ((srcH<<16) + (dstH>>1))/dstH;
	c->flags= flags;
	c->dstFormat= dstFormat;
	c->srcFormat= srcFormat;
	c->origDstFormat= origDstFormat;
	c->origSrcFormat= origSrcFormat;
	c->vRounder= 4* 0x0001000100010001ULL;

	/* a filter only counts as "used" if it has more than one tap */
	usesHFilter= usesVFilter= 0;
	if(dstFilter->lumV!=NULL && dstFilter->lumV->length>1) usesVFilter=1;
	if(dstFilter->lumH!=NULL && dstFilter->lumH->length>1) usesHFilter=1;
	if(dstFilter->chrV!=NULL && dstFilter->chrV->length>1) usesVFilter=1;
	if(dstFilter->chrH!=NULL && dstFilter->chrH->length>1) usesHFilter=1;
	if(srcFilter->lumV!=NULL && srcFilter->lumV->length>1) usesVFilter=1;
	if(srcFilter->lumH!=NULL && srcFilter->lumH->length>1) usesHFilter=1;
	if(srcFilter->chrV!=NULL && srcFilter->chrV->length>1) usesVFilter=1;
	if(srcFilter->chrH!=NULL && srcFilter->chrH->length>1) usesHFilter=1;

	getSubSampleFactors(&c->chrSrcHSubSample, &c->chrSrcVSubSample, srcFormat);
	getSubSampleFactors(&c->chrDstHSubSample, &c->chrDstVSubSample, dstFormat);

	// reuse chroma for 2 pixels rgb/bgr unless user wants full chroma interpolation
	if((isBGR(dstFormat) || isRGB(dstFormat)) && !(flags&SWS_FULL_CHR_H_INT)) c->chrDstHSubSample=1;

	// drop some chroma lines if the user wants it
	c->vChrDrop= (flags&SWS_SRC_V_CHR_DROP_MASK)>>SWS_SRC_V_CHR_DROP_SHIFT;
	c->chrSrcVSubSample+= c->vChrDrop;

	// drop every 2. pixel for chroma calculation unless user wants full chroma
	if((isBGR(srcFormat) || isRGB(srcFormat)) && !(flags&SWS_FULL_CHR_H_INP))
		c->chrSrcHSubSample=1;

	if(param){
		c->param[0] = param[0];
		c->param[1] = param[1];
	}else{
		c->param[0] =
		c->param[1] = SWS_PARAM_DEFAULT;
	}

	c->chrIntHSubSample= c->chrDstHSubSample;
	c->chrIntVSubSample= c->chrSrcVSubSample;

	// note the -((-x)>>y) is so that we always round toward +inf
	c->chrSrcW= -((-srcW) >> c->chrSrcHSubSample);
	c->chrSrcH= -((-srcH) >> c->chrSrcVSubSample);
	c->chrDstW= -((-dstW) >> c->chrDstHSubSample);
	c->chrDstH= -((-dstH) >> c->chrDstVSubSample);

	/* the return value is ignored on purpose: -1 only means the destination is YUV or gray */
	sws_setColorspaceDetails(c, Inverse_Table_6_9[SWS_CS_DEFAULT], 0, Inverse_Table_6_9[SWS_CS_DEFAULT] /* FIXME*/, 0, 0, 1<<16, 1<<16);

	/* unscaled special Cases */
	if(unscaled && !usesHFilter && !usesVFilter)
	{
		/* yv12_to_nv12 */
		if(srcFormat == IMGFMT_YV12 && (dstFormat == IMGFMT_NV12 || dstFormat == IMGFMT_NV21))
		{
			c->swScale= PlanarToNV12Wrapper;
		}
		/* yuv2bgr */
		if((srcFormat==IMGFMT_YV12 || srcFormat==IMGFMT_422P) && (isBGR(dstFormat) || isRGB(dstFormat)))
		{
			c->swScale= yuv2rgb_get_func_ptr(c);
		}

		if( srcFormat==IMGFMT_YVU9 && dstFormat==IMGFMT_YV12 )
		{
			c->swScale= yvu9toyv12Wrapper;
		}

		/* bgr24toYV12 */
		if(srcFormat==IMGFMT_BGR24 && dstFormat==IMGFMT_YV12)
			c->swScale= bgr24toyv12Wrapper;

		/* rgb/bgr -> rgb/bgr (no dither needed forms) */
		if(   (isBGR(srcFormat) || isRGB(srcFormat))
		   && (isBGR(dstFormat) || isRGB(dstFormat))
		   && !needsDither)
			c->swScale= rgb2rgbWrapper;

		/* LQ converters if -sws 0 or -sws 4*/
		if(c->flags&(SWS_FAST_BILINEAR|SWS_POINT)){
			/* rgb/bgr -> rgb/bgr (dither needed forms) */
			if(  (isBGR(srcFormat) || isRGB(srcFormat))
			  && (isBGR(dstFormat) || isRGB(dstFormat))
			  && needsDither)
				c->swScale= rgb2rgbWrapper;

			/* yv12_to_yuy2 */
			if(srcFormat == IMGFMT_YV12 &&
			    (dstFormat == IMGFMT_YUY2 || dstFormat == IMGFMT_UYVY))
			{
				if (dstFormat == IMGFMT_YUY2)
					c->swScale= PlanarToYuy2Wrapper;
				else
					c->swScale= PlanarToUyvyWrapper;
			}
		}

#ifdef COMPILE_ALTIVEC
		if ((c->flags & SWS_CPU_CAPS_ALTIVEC) &&
		    ((srcFormat == IMGFMT_YV12 &&
		      (dstFormat == IMGFMT_YUY2 || dstFormat == IMGFMT_UYVY)))) {
			// unscaled YV12 -> packed YUV, we want speed
			if (dstFormat == IMGFMT_YUY2)
				c->swScale= yv12toyuy2_unscaled_altivec;
			else
				c->swScale= yv12touyvy_unscaled_altivec;
		}
#endif

		/* simple copy */
		if(   srcFormat == dstFormat
		   || (isPlanarYUV(srcFormat) && isGray(dstFormat))
		   || (isPlanarYUV(dstFormat) && isGray(srcFormat))
		  )
		{
			c->swScale= simpleCopy;
		}

		/* a special converter was found: none of the filter setup below is needed */
		if(c->swScale){
			if(flags&SWS_PRINT_INFO)
				MSG_INFO("SwScaler: using unscaled %s -> %s special converter\n",
					vo_format_name(srcFormat), vo_format_name(dstFormat));
			return c;
		}
	}

	if(flags & SWS_CPU_CAPS_MMX2)
	{
		c->canMMX2BeUsed= (dstW >=srcW && (dstW&31)==0 && (srcW&15)==0) ? 1 : 0;
		if(!c->canMMX2BeUsed && dstW >=srcW && (srcW&15)==0 && (flags&SWS_FAST_BILINEAR))
		{
			if(flags&SWS_PRINT_INFO)
				MSG_INFO("SwScaler: output Width is not a multiple of 32 -> no MMX2 scaler\n");
		}
		if(usesHFilter) c->canMMX2BeUsed=0;
	}
	else
		c->canMMX2BeUsed=0;

	c->chrXInc= ((c->chrSrcW<<16) + (c->chrDstW>>1))/c->chrDstW;
	c->chrYInc= ((c->chrSrcH<<16) + (c->chrDstH>>1))/c->chrDstH;

	// match pixel 0 of the src to pixel 0 of dst and match pixel n-2 of src to pixel n-2 of dst
	// but only for the FAST_BILINEAR mode otherwise do correct scaling
	// n-2 is the last chrominance sample available
	// this is not perfect, but no one should notice the difference, the more correct variant
	// would be like the vertical one, but that would require some special code for the
	// first and last pixel
	if(flags&SWS_FAST_BILINEAR)
	{
		if(c->canMMX2BeUsed)
		{
			c->lumXInc+= 20;
			c->chrXInc+= 20;
		}
		//we don't use the x86asm scaler if mmx is available
		else if(flags & SWS_CPU_CAPS_MMX)
		{
			c->lumXInc = ((srcW-2)<<16)/(dstW-2) - 20;
			/* NOTE(review): divides by zero if chrDstW can be 2 here (dstW==8 with a
			   horizontal chroma shift of 2) - confirm against getSubSampleFactors() */
			c->chrXInc = ((c->chrSrcW-2)<<16)/(c->chrDstW-2) - 20;
		}
	}

	/* precalculate horizontal scaler filter coefficients */
	{
		const int filterAlign=
		  (flags & SWS_CPU_CAPS_MMX) ? 4 :
		  (flags & SWS_CPU_CAPS_ALTIVEC) ? 8 :
		  1;

		initFilter(&c->hLumFilter, &c->hLumFilterPos, &c->hLumFilterSize, c->lumXInc,
				 srcW      ,       dstW, filterAlign, 1<<14,
				 (flags&SWS_BICUBLIN) ? (flags|SWS_BICUBIC)  : flags,
				 srcFilter->lumH, dstFilter->lumH, c->param);
		initFilter(&c->hChrFilter, &c->hChrFilterPos, &c->hChrFilterSize, c->chrXInc,
				 c->chrSrcW, c->chrDstW, filterAlign, 1<<14,
				 (flags&SWS_BICUBLIN) ? (flags|SWS_BILINEAR) : flags,
				 srcFilter->chrH, dstFilter->chrH, c->param);

#if defined(ARCH_X86) || defined(ARCH_X86_64)
// can't downscale !!!
		if(c->canMMX2BeUsed && (flags & SWS_FAST_BILINEAR))
		{
#define MAX_FUNNY_CODE_SIZE 10000
#ifdef MAP_ANONYMOUS
			/* anonymous mappings take fd -1 for portability and signal failure
			   with MAP_FAILED, which is normalised to NULL here */
			c->funnyYCode = (uint8_t*)mmap(NULL, MAX_FUNNY_CODE_SIZE, PROT_EXEC | PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
			c->funnyUVCode = (uint8_t*)mmap(NULL, MAX_FUNNY_CODE_SIZE, PROT_EXEC | PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
			if(c->funnyYCode  == (uint8_t*)MAP_FAILED) c->funnyYCode = NULL;
			if(c->funnyUVCode == (uint8_t*)MAP_FAILED) c->funnyUVCode= NULL;
#else
			c->funnyYCode = (uint8_t*)memalign(32, MAX_FUNNY_CODE_SIZE);
			c->funnyUVCode = (uint8_t*)memalign(32, MAX_FUNNY_CODE_SIZE);
#endif

			c->lumMmx2Filter   = (int16_t*)memalign(8, (dstW        /8+8)*sizeof(int16_t));
			c->chrMmx2Filter   = (int16_t*)memalign(8, (c->chrDstW  /4+8)*sizeof(int16_t));
			c->lumMmx2FilterPos= (int32_t*)memalign(8, (dstW      /2/8+8)*sizeof(int32_t));
			c->chrMmx2FilterPos= (int32_t*)memalign(8, (c->chrDstW/2/4+8)*sizeof(int32_t));

			/* initMMX2HScaler() writes into all six buffers, so none may be missing */
			if(!c->funnyYCode || !c->funnyUVCode
			   || !c->lumMmx2Filter || !c->chrMmx2Filter
			   || !c->lumMmx2FilterPos || !c->chrMmx2FilterPos)
			{
				MSG_ERR("swScaler: could not allocate the MMX2 scaler buffers\n");
				sws_freeContext(c);
				return NULL;
			}

			initMMX2HScaler(      dstW, c->lumXInc, c->funnyYCode , c->lumMmx2Filter, c->lumMmx2FilterPos, 8);
			initMMX2HScaler(c->chrDstW, c->chrXInc, c->funnyUVCode, c->chrMmx2Filter, c->chrMmx2FilterPos, 4);
		}
#endif
	} // Init Horizontal stuff



	/* precalculate vertical scaler filter coefficients */
	{
		const int filterAlign=
		  (flags & SWS_CPU_CAPS_ALTIVEC) ? 8 :
		  1;

		initFilter(&c->vLumFilter, &c->vLumFilterPos, &c->vLumFilterSize, c->lumYInc,
				srcH      ,        dstH, filterAlign, (1<<12)-4,
				(flags&SWS_BICUBLIN) ? (flags|SWS_BICUBIC)  : flags,
				srcFilter->lumV, dstFilter->lumV, c->param);
		initFilter(&c->vChrFilter, &c->vChrFilterPos, &c->vChrFilterSize, c->chrYInc,
				c->chrSrcH, c->chrDstH, filterAlign, (1<<12)-4,
				(flags&SWS_BICUBLIN) ? (flags|SWS_BILINEAR) : flags,
				srcFilter->chrV, dstFilter->chrV, c->param);

#ifdef HAVE_ALTIVEC
		c->vYCoeffsBank = memalign (16, sizeof (vector signed short)*c->vLumFilterSize*c->dstH);
		c->vCCoeffsBank = memalign (16, sizeof (vector signed short)*c->vChrFilterSize*c->chrDstH);

		/* every coefficient is replicated into all 8 lanes of one vector */
		for (i=0;i<c->vLumFilterSize*c->dstH;i++) {
			int j;
			short *p = (short *)&c->vYCoeffsBank[i];
			for (j=0;j<8;j++)
				p[j] = c->vLumFilter[i];
		}

		for (i=0;i<c->vChrFilterSize*c->chrDstH;i++) {
			int j;
			short *p = (short *)&c->vCCoeffsBank[i];
			for (j=0;j<8;j++)
				p[j] = c->vChrFilter[i];
		}
#endif
	}

	// Calculate Buffer Sizes so that they won't run out while handling these damn slices
	c->vLumBufSize= c->vLumFilterSize;
	c->vChrBufSize= c->vChrFilterSize;
	for(i=0; i<dstH; i++)
	{
		int chrI= i*c->chrDstH / dstH;
		int nextSlice= MAX(c->vLumFilterPos[i   ] + c->vLumFilterSize - 1,
				 ((c->vChrFilterPos[chrI] + c->vChrFilterSize - 1)<<c->chrSrcVSubSample));

		/* round down to a multiple of the vertical chroma subsampling */
		nextSlice>>= c->chrSrcVSubSample;
		nextSlice<<= c->chrSrcVSubSample;
		if(c->vLumFilterPos[i   ] + c->vLumBufSize < nextSlice)
			c->vLumBufSize= nextSlice - c->vLumFilterPos[i   ];
		if(c->vChrFilterPos[chrI] + c->vChrBufSize < (nextSlice>>c->chrSrcVSubSample))
			c->vChrBufSize= (nextSlice>>c->chrSrcVSubSample) - c->vChrFilterPos[chrI];
	}

	// allocate pixbufs dynamically; each pointer array is twice as long as the
	// buffer count and its second half aliases the first
	c->lumPixBuf= (int16_t**)memalign(4, c->vLumBufSize*2*sizeof(int16_t*));
	c->chrPixBuf= (int16_t**)memalign(4, c->vChrBufSize*2*sizeof(int16_t*));
	//Note we need at least one pixel more at the end because of the mmx code (just in case someone wanna replace the 4000/8000)
	/* NOTE(review): the fixed 4000/8000 byte line buffers look like they cap the
	   usable destination width - confirm against the scaler code */
	/* align at 16 bytes for AltiVec */
	for(i=0; i<c->vLumBufSize; i++)
		c->lumPixBuf[i]= c->lumPixBuf[i+c->vLumBufSize]= (uint16_t*)memalign(16, 4000);
	for(i=0; i<c->vChrBufSize; i++)
		c->chrPixBuf[i]= c->chrPixBuf[i+c->vChrBufSize]= (uint16_t*)memalign(16, 8000);

	//try to avoid drawing green stuff between the right end and the stride end
	for(i=0; i<c->vLumBufSize; i++) memset(c->lumPixBuf[i], 0, 4000);
	for(i=0; i<c->vChrBufSize; i++) memset(c->chrPixBuf[i], 64, 8000);

	ASSERT(c->chrDstH <= dstH)

	if(flags&SWS_PRINT_INFO)
	{
#ifdef DITHER1XBPP
		char *dither= " dithered";
#else
		char *dither= "";
#endif
		if(flags&SWS_FAST_BILINEAR)
			MSG_INFO("\nSwScaler: FAST_BILINEAR scaler, ");
		else if(flags&SWS_BILINEAR)
			MSG_INFO("\nSwScaler: BILINEAR scaler, ");
		else if(flags&SWS_BICUBIC)
			MSG_INFO("\nSwScaler: BICUBIC scaler, ");
		else if(flags&SWS_X)
			MSG_INFO("\nSwScaler: Experimental scaler, ");
		else if(flags&SWS_POINT)
			MSG_INFO("\nSwScaler: Nearest Neighbor / POINT scaler, ");
		else if(flags&SWS_AREA)
			MSG_INFO("\nSwScaler: Area Averageing scaler, ");
		else if(flags&SWS_BICUBLIN)
			MSG_INFO("\nSwScaler: luma BICUBIC / chroma BILINEAR scaler, ");
		else if(flags&SWS_GAUSS)
			MSG_INFO("\nSwScaler: Gaussian scaler, ");
		else if(flags&SWS_SINC)
			MSG_INFO("\nSwScaler: Sinc scaler, ");
		else if(flags&SWS_LANCZOS)
			MSG_INFO("\nSwScaler: Lanczos scaler, ");
		else if(flags&SWS_SPLINE)
			MSG_INFO("\nSwScaler: Bicubic spline scaler, ");
		else
			MSG_INFO("\nSwScaler: ehh flags invalid?! ");

		if(dstFormat==IMGFMT_BGR15 || dstFormat==IMGFMT_BGR16)
			MSG_INFO("from %s to%s %s ",
				vo_format_name(srcFormat), dither, vo_format_name(dstFormat));
		else
			MSG_INFO("from %s to %s ",
				vo_format_name(srcFormat), vo_format_name(dstFormat));

		if(flags & SWS_CPU_CAPS_MMX2)
			MSG_INFO("using MMX2\n");
		else if(flags & SWS_CPU_CAPS_3DNOW)
			MSG_INFO("using 3DNOW\n");
		else if(flags & SWS_CPU_CAPS_MMX)
			MSG_INFO("using MMX\n");
		else if(flags & SWS_CPU_CAPS_ALTIVEC)
			MSG_INFO("using AltiVec\n");
		else
			MSG_INFO("using C\n");
	}

	if(flags & SWS_PRINT_INFO)
	{
		if(flags & SWS_CPU_CAPS_MMX)
		{
			if(c->canMMX2BeUsed && (flags&SWS_FAST_BILINEAR))
				MSG_V("SwScaler: using FAST_BILINEAR MMX2 scaler for horizontal scaling\n");
			else
			{
				if(c->hLumFilterSize==4)
					MSG_V("SwScaler: using 4-tap MMX scaler for horizontal luminance scaling\n");
				else if(c->hLumFilterSize==8)
					MSG_V("SwScaler: using 8-tap MMX scaler for horizontal luminance scaling\n");
				else
					MSG_V("SwScaler: using n-tap MMX scaler for horizontal luminance scaling\n");

				if(c->hChrFilterSize==4)
					MSG_V("SwScaler: using 4-tap MMX scaler for horizontal chrominance scaling\n");
				else if(c->hChrFilterSize==8)
					MSG_V("SwScaler: using 8-tap MMX scaler for horizontal chrominance scaling\n");
				else
					MSG_V("SwScaler: using n-tap MMX scaler for horizontal chrominance scaling\n");
			}
		}
		else
		{
#if defined(ARCH_X86) || defined(ARCH_X86_64)
			MSG_V("SwScaler: using X86-Asm scaler for horizontal scaling\n");
#else
			if(flags & SWS_FAST_BILINEAR)
				MSG_V("SwScaler: using FAST_BILINEAR C scaler for horizontal scaling\n");
			else
				MSG_V("SwScaler: using C scaler for horizontal scaling\n");
#endif
		}
		if(isPlanarYUV(dstFormat))
		{
			if(c->vLumFilterSize==1)
				MSG_V("SwScaler: using 1-tap %s \"scaler\" for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
			else
				MSG_V("SwScaler: using n-tap %s scaler for vertical scaling (YV12 like)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
		}
		else
		{
			if(c->vLumFilterSize==1 && c->vChrFilterSize==2)
				MSG_V("SwScaler: using 1-tap %s \"scaler\" for vertical luminance scaling (BGR)\n"
				       "SwScaler: 2-tap scaler for vertical chrominance scaling (BGR)\n",(flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
			else if(c->vLumFilterSize==2 && c->vChrFilterSize==2)
				MSG_V("SwScaler: using 2-tap linear %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
			else
				MSG_V("SwScaler: using n-tap %s scaler for vertical scaling (BGR)\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
		}

		if(dstFormat==IMGFMT_BGR24)
			MSG_V("SwScaler: using %s YV12->BGR24 Converter\n",
				(flags & SWS_CPU_CAPS_MMX2) ? "MMX2" : ((flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C"));
		else if(dstFormat==IMGFMT_BGR32)
			MSG_V("SwScaler: using %s YV12->BGR32 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
		else if(dstFormat==IMGFMT_BGR16)
			MSG_V("SwScaler: using %s YV12->BGR16 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");
		else if(dstFormat==IMGFMT_BGR15)
			MSG_V("SwScaler: using %s YV12->BGR15 Converter\n", (flags & SWS_CPU_CAPS_MMX) ? "MMX" : "C");

		MSG_V("SwScaler: %dx%d -> %dx%d\n", srcW, srcH, dstW, dstH);
	}
	if(flags & SWS_PRINT_INFO)
	{
		MSG_DBG2("SwScaler:Lum srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
			c->srcW, c->srcH, c->dstW, c->dstH, c->lumXInc, c->lumYInc);
		MSG_DBG2("SwScaler:Chr srcW=%d srcH=%d dstW=%d dstH=%d xInc=%d yInc=%d\n",
			c->chrSrcW, c->chrSrcH, c->chrDstW, c->chrDstH, c->chrXInc, c->chrYInc);
	}

	c->swScale= getSwsFunc(flags);
	return c;
}

2293

2294

/**

2295

* swscale warper, so we don't need to export the SwsContext.

2296

* assumes planar YUV to be in YUV order instead of YVU

2297

2298

int sws_scale_ordered(SwsContext *c, uint8_t* src[], int srcStride[], int srcSliceY,

2299

int srcSliceH, uint8_t* dst[], int dstStride[]){

2300

if (c->sliceDir == 0 && srcSliceY != 0 && srcSliceY + srcSliceH != c->srcH) {

2301

MSG_ERR("swScaler: slices start in the middle!\n");

2302

return 0;

2303

}

2304

if (c->sliceDir == 0) {

2305

if (srcSliceY == 0) c->sliceDir = 1; else c->sliceDir = -1;

2306

}

2307

2308

// copy strides, so they can safely be modified

2309

if (c->sliceDir == 1) {

2310

// slices go from top to bottom

2311

int srcStride2[3]= {srcStride[0], srcStride[1], srcStride[2]};

2312

int dstStride2[3]= {dstStride[0], dstStride[1], dstStride[2]};

2313

return c->swScale(c, src, srcStride2, srcSliceY, srcSliceH, dst, dstStride2);

2314

} else {

2315

// slices go from bottom to top => we flip the image internally

2316

uint8_t* src2[3]= {src[0] + (srcSliceH-1)*srcStride[0],

2317

src[1] + ((srcSliceH>>c->chrSrcVSubSample)-1)*srcStride[1],

2318

src[2] + ((srcSliceH>>c->chrSrcVSubSample)-1)*srcStride[2]

2319

};

2320

uint8_t* dst2[3]= {dst[0] + (c->dstH-1)*dstStride[0],

2321

dst[1] + ((c->dstH>>c->chrDstVSubSample)-1)*dstStride[1],

2322

dst[2] + ((c->dstH>>c->chrDstVSubSample)-1)*dstStride[2]};

2323

int srcStride2[3]= {-srcStride[0], -srcStride[1], -srcStride[2]};

2324

int dstStride2[3]= {-dstStride[0], -dstStride[1], -dstStride[2]};

2325

2326

return c->swScale(c, src2, srcStride2, c->srcH-srcSliceY-srcSliceH, srcSliceH, dst2, dstStride2);

2327

}

2328

}

2329

2330

/**

2331

* swscale warper, so we don't need to export the SwsContext

2332

2333

int sws_scale(SwsContext *c, uint8_t* srcParam[], int srcStrideParam[], int srcSliceY,

2334

int srcSliceH, uint8_t* dstParam[], int dstStrideParam[]){

2335

int srcStride[3];

2336

int dstStride[3];

2337

uint8_t *src[3];

2338

uint8_t *dst[3];

2339

sws_orderYUV(c->origSrcFormat, src, srcStride, srcParam, srcStrideParam);

2340

sws_orderYUV(c->origDstFormat, dst, dstStride, dstParam, dstStrideParam);

2341

//printf("sws: slice %d %d\n", srcSliceY, srcSliceH);

2342

2343

return c->swScale(c, src, srcStride, srcSliceY, srcSliceH, dst, dstStride);

2344

}

2345

2346

SwsFilter *sws_getDefaultFilter(float lumaGBlur, float chromaGBlur,

2347

float lumaSharpen, float chromaSharpen,

2348

float chromaHShift, float chromaVShift,

2349

int verbose)

2350

{

2351

SwsFilter *filter= malloc(sizeof(SwsFilter));

2352

2353

if(lumaGBlur!=0.0){

2354

filter->lumH= sws_getGaussianVec(lumaGBlur, 3.0);

2355

filter->lumV= sws_getGaussianVec(lumaGBlur, 3.0);

2356

}else{

2357

filter->lumH= sws_getIdentityVec();

2358

filter->lumV= sws_getIdentityVec();

2359

}

2360

2361

if(chromaGBlur!=0.0){

2362

filter->chrH= sws_getGaussianVec(chromaGBlur, 3.0);

2363

filter->chrV= sws_getGaussianVec(chromaGBlur, 3.0);

2364

}else{

2365

filter->chrH= sws_getIdentityVec();

2366

filter->chrV= sws_getIdentityVec();

2367

}

2368

2369

if(chromaSharpen!=0.0){

2370

SwsVector *id= sws_getIdentityVec();

2371

sws_scaleVec(filter->chrH, -chromaSharpen);

2372

sws_scaleVec(filter->chrV, -chromaSharpen);

2373

sws_addVec(filter->chrH, id);

2374

sws_addVec(filter->chrV, id);

2375

sws_freeVec(id);

2376

}

2377

2378

if(lumaSharpen!=0.0){

2379

SwsVector *id= sws_getIdentityVec();

2380

sws_scaleVec(filter->lumH, -lumaSharpen);

2381

sws_scaleVec(filter->lumV, -lumaSharpen);

2382

sws_addVec(filter->lumH, id);

2383

sws_addVec(filter->lumV, id);

2384

sws_freeVec(id);

2385

}

2386

2387

if(chromaHShift != 0.0)

2388

sws_shiftVec(filter->chrH, (int)(chromaHShift+0.5));

2389

2390

if(chromaVShift != 0.0)

2391

sws_shiftVec(filter->chrV, (int)(chromaVShift+0.5));

2392

2393

sws_normalizeVec(filter->chrH, 1.0);

2394

sws_normalizeVec(filter->chrV, 1.0);

2395

sws_normalizeVec(filter->lumH, 1.0);

2396

sws_normalizeVec(filter->lumV, 1.0);

2397

2398

if(verbose) sws_printVec(filter->chrH);

2399

if(verbose) sws_printVec(filter->lumH);

2400

2401

return filter;

2402

}

2403

2404

/**

2405

* returns a normalized gaussian curve used to filter stuff

2406

* quality=3 is high quality, lowwer is lowwer quality

2407

2408

SwsVector *sws_getGaussianVec(double variance, double quality){

2409

const int length= (int)(variance*quality + 0.5) | 1;

2410

int i;

2411

double *coeff= memalign(sizeof(double), length*sizeof(double));

2412

double middle= (length-1)*0.5;

2413

SwsVector *vec= malloc(sizeof(SwsVector));

2414

2415

vec->coeff= coeff;

2416

vec->length= length;

2417

2418

for(i=0; i<length; i++)

2419

{

2420

double dist= i-middle;

2421

coeff[i]= exp( -dist*dist/(2*variance*variance) ) / sqrt(2*variance*PI);

2422

}

2423

2424

sws_normalizeVec(vec, 1.0);

2425

2426

return vec;

2427

}

2428

2429

SwsVector *sws_getConstVec(double c, int length){

2430

int i;

2431

double *coeff= memalign(sizeof(double), length*sizeof(double));

2432

SwsVector *vec= malloc(sizeof(SwsVector));

2433

2434

vec->coeff= coeff;

2435

vec->length= length;

2436

2437

for(i=0; i<length; i++)

2438

coeff[i]= c;

2439

2440

return vec;

2441

}

2442

2443

2444

/**
 * Returns a new one-element vector whose only coefficient is 1.0.
 */
SwsVector *sws_getIdentityVec(void){
	SwsVector *identity= sws_getConstVec(1.0, 1);

	return identity;
}

2447

2448

/**
 * Returns the sum of all coefficients of a, added up front to back.
 */
double sws_dcVec(SwsVector *a){
	const double *cur= a->coeff;
	int remaining= a->length;
	double total=0;

	while(remaining-- > 0)
		total+= *cur++;

	return total;
}

2457

2458

/**
 * Multiplies every coefficient of a by scalar, in place.
 */
void sws_scaleVec(SwsVector *a, double scalar){
	double *cur= a->coeff;
	int remaining= a->length;

	while(remaining-- > 0){
		*cur*= scalar;
		cur++;
	}
}

2464

2465

/**
 * Rescales a in place so that its coefficients add up to height.
 * The current sum is used as a divisor and is not checked for zero.
 */
void sws_normalizeVec(SwsVector *a, double height){
	const double currentSum= sws_dcVec(a);

	sws_scaleVec(a, height/currentSum);
}

2468

2469

/**
 * Returns a new vector holding the convolution of a and b
 * (a->length + b->length - 1 coefficients). Neither input is modified.
 */
static SwsVector *sws_getConvVec(SwsVector *a, SwsVector *b){
	const int outLen= a->length + b->length - 1;
	double *out= memalign(sizeof(double), outLen*sizeof(double));
	SwsVector *result= malloc(sizeof(SwsVector));
	int k;

	result->coeff= out;
	result->length= outLen;

	/* one output tap at a time; the products for a tap are accumulated with
	   the index into a rising */
	for(k=0; k<outLen; k++)
	{
		int first= k - (b->length-1);
		int last = k;
		int ai;
		double acc= 0.0;

		if(first < 0) first= 0;
		if(last > a->length-1) last= a->length-1;

		for(ai=first; ai<=last; ai++)
			acc+= a->coeff[ai]*b->coeff[k-ai];

		out[k]= acc;
	}

	return result;
}

2490

2491

/**
 * Returns a new vector holding a + b. The result is as long as the longer
 * input; each input is centered in it before being added.
 */
static SwsVector *sws_sumVec(SwsVector *a, SwsVector *b){
	const int outLen= MAX(a->length, b->length);
	/* index of each input's first coefficient inside the output */
	const int aStart= (outLen-1)/2 - (a->length-1)/2;
	const int bStart= (outLen-1)/2 - (b->length-1)/2;
	double *out= memalign(sizeof(double), outLen*sizeof(double));
	SwsVector *result= malloc(sizeof(SwsVector));
	int k;

	result->length= outLen;
	result->coeff= out;

	for(k=0; k<outLen; k++) out[k]= 0.0;

	for(k=0; k<a->length; k++) out[aStart + k]+= a->coeff[k];
	for(k=0; k<b->length; k++) out[bStart + k]+= b->coeff[k];

	return result;
}

2507

2508

/**
 * Returns a new vector holding a - b. The result is as long as the longer
 * input; each input is centered in it before being combined.
 */
static SwsVector *sws_diffVec(SwsVector *a, SwsVector *b){
	const int outLen= MAX(a->length, b->length);
	/* index of each input's first coefficient inside the output */
	const int aStart= (outLen-1)/2 - (a->length-1)/2;
	const int bStart= (outLen-1)/2 - (b->length-1)/2;
	double *out= memalign(sizeof(double), outLen*sizeof(double));
	SwsVector *result= malloc(sizeof(SwsVector));
	int k;

	result->length= outLen;
	result->coeff= out;

	for(k=0; k<outLen; k++) out[k]= 0.0;

	for(k=0; k<a->length; k++) out[aStart + k]+= a->coeff[k];
	for(k=0; k<b->length; k++) out[bStart + k]-= b->coeff[k];

	return result;
}

2524

2525

/* shift left / or right if "shift" is negative */

2526

static SwsVector *sws_getShiftedVec(SwsVector *a, int shift){

2527

int length= a->length + ABS(shift)*2;

2528

double *coeff= memalign(sizeof(double), length*sizeof(double));

2529

int i;

2530

SwsVector *vec= malloc(sizeof(SwsVector));

2531

2532

vec->coeff= coeff;

2533

vec->length= length;

2534

2535

for(i=0; i<length; i++) coeff[i]= 0.0;

2536

2537

for(i=0; i<a->length; i++)

2538

{

2539

coeff[i + (length-1)/2 - (a->length-1)/2 - shift]= a->coeff[i];

2540

}

2541

2542

return vec;

2543

}

2544

2545

/**
 * Shifts a in place: its coefficient array is replaced by the one built by
 * sws_getShiftedVec() and the old array is freed.
 */
void sws_shiftVec(SwsVector *a, int shift){
	SwsVector *tmp= sws_getShiftedVec(a, shift);
	double *oldCoeff= a->coeff;

	/* take over the payload of the temporary, then drop its empty shell */
	a->length= tmp->length;
	a->coeff= tmp->coeff;
	free(oldCoeff);
	free(tmp);
}

2552

2553

/**
 * Adds b to a in place: a's coefficient array is replaced by the one built by
 * sws_sumVec() and the old array is freed. b is not modified.
 */
void sws_addVec(SwsVector *a, SwsVector *b){
	SwsVector *tmp= sws_sumVec(a, b);
	double *oldCoeff= a->coeff;

	/* take over the payload of the temporary, then drop its empty shell */
	a->length= tmp->length;
	a->coeff= tmp->coeff;
	free(oldCoeff);
	free(tmp);
}

2560

2561

/**
 * Subtracts b from a in place: a's coefficient array is replaced by the one
 * built by sws_diffVec() and the old array is freed. b is not modified.
 */
void sws_subVec(SwsVector *a, SwsVector *b){
	SwsVector *tmp= sws_diffVec(a, b);
	double *oldCoeff= a->coeff;

	/* take over the payload of the temporary, then drop its empty shell */
	a->length= tmp->length;
	a->coeff= tmp->coeff;
	free(oldCoeff);
	free(tmp);
}

2568

2569

/**
 * Convolves a with b in place: a's coefficient array is replaced by the one
 * built by sws_getConvVec() and the old array is freed. b is not modified.
 */
void sws_convVec(SwsVector *a, SwsVector *b){
	SwsVector *tmp= sws_getConvVec(a, b);
	double *oldCoeff= a->coeff;

	/* take over the payload of the temporary, then drop its empty shell */
	a->length= tmp->length;
	a->coeff= tmp->coeff;
	free(oldCoeff);
	free(tmp);
}

2576

2577

/**
 * Returns a newly allocated copy of a (same length, same coefficients).
 *
 * @return the copy, or NULL if it could not be allocated
 */
SwsVector *sws_cloneVec(SwsVector *a){
	double *coeff= memalign(sizeof(double), a->length*sizeof(double));
	int i;
	SwsVector *vec= malloc(sizeof(SwsVector));

	/* both buffers are written below, so neither may be missing */
	if(!coeff || !vec){
		free(coeff);
		free(vec);
		return NULL;
	}

	vec->coeff= coeff;
	vec->length= a->length;

	for(i=0; i<a->length; i++) coeff[i]= a->coeff[i];

	return vec;
}

2589

2590

/**
 * Prints a as a crude sideways bar chart through MSG_DBG2: one line per
 * coefficient with its value, then up to 60 spaces, then a '|'.
 *
 * The bar scale runs from min to max, where both start at 0, so 0 is always
 * inside the plotted range.
 */
void sws_printVec(SwsVector *a){
	int i;
	double max=0;
	double min=0;
	double range;

	for(i=0; i<a->length; i++)
	{
		if(a->coeff[i]>max) max= a->coeff[i];
		if(a->coeff[i]<min) min= a->coeff[i];
	}

	range= max - min;

	for(i=0; i<a->length; i++)
	{
		/* an all-zero vector has range 0; draw empty bars instead of dividing by it */
		int x= (range > 0.0) ? (int)((a->coeff[i]-min)*60.0/range +0.5) : 0;
		MSG_DBG2("%1.3f ", a->coeff[i]);
		for(;x>0; x--) MSG_DBG2(" ");
		MSG_DBG2("|\n");
	}
}

2612

2613

/**
 * Frees a vector together with its coefficient array. NULL is accepted and
 * ignored.
 */
void sws_freeVec(SwsVector *a){
	if(a){
		/* free(NULL) is a no-op, so the array needs no separate check */
		free(a->coeff);
		a->length=0;
		a->coeff=NULL;
		free(a);
	}
}

2620

2621

/**
 * Frees a filter together with its four vectors. NULL is accepted and
 * ignored, and so are vectors that are NULL.
 */
void sws_freeFilter(SwsFilter *filter){
	if(filter){
		/* sws_freeVec() ignores NULL itself */
		sws_freeVec(filter->lumH);
		sws_freeVec(filter->lumV);
		sws_freeVec(filter->chrH);
		sws_freeVec(filter->chrV);
		free(filter);
	}
}

2630

2631

2632

/**
 * Releases a context and every buffer it owns. NULL is accepted and ignored.
 * Each member is reset to NULL right after it has been released.
 */
void sws_freeContext(SwsContext *c){
	int i;
	if(!c) return;

/* free(NULL) is a no-op, so members that were never allocated need no check */
#define SWS_RELEASE(member) do{ free(member); (member)= NULL; }while(0)

	/* only the first vLumBufSize / vChrBufSize entries of the line pointer
	   arrays are freed here */
	if(c->lumPixBuf)
	{
		for(i=0; i<c->vLumBufSize; i++)
			SWS_RELEASE(c->lumPixBuf[i]);
		SWS_RELEASE(c->lumPixBuf);
	}

	if(c->chrPixBuf)
	{
		for(i=0; i<c->vChrBufSize; i++)
			SWS_RELEASE(c->chrPixBuf[i]);
		SWS_RELEASE(c->chrPixBuf);
	}

	SWS_RELEASE(c->vLumFilter);
	SWS_RELEASE(c->vChrFilter);
	SWS_RELEASE(c->hLumFilter);
	SWS_RELEASE(c->hChrFilter);
#ifdef HAVE_ALTIVEC
	SWS_RELEASE(c->vYCoeffsBank);
	SWS_RELEASE(c->vCCoeffsBank);
#endif

	SWS_RELEASE(c->vLumFilterPos);
	SWS_RELEASE(c->vChrFilterPos);
	SWS_RELEASE(c->hLumFilterPos);
	SWS_RELEASE(c->hChrFilterPos);

#if defined(ARCH_X86) || defined(ARCH_X86_64)
	/* the generated scaler code is released the way it was obtained */
#ifdef MAP_ANONYMOUS
	if(c->funnyYCode) munmap(c->funnyYCode, MAX_FUNNY_CODE_SIZE);
	if(c->funnyUVCode) munmap(c->funnyUVCode, MAX_FUNNY_CODE_SIZE);
#else
	free(c->funnyYCode);
	free(c->funnyUVCode);
#endif
	c->funnyYCode=NULL;
	c->funnyUVCode=NULL;
#endif

	SWS_RELEASE(c->lumMmx2Filter);
	SWS_RELEASE(c->chrMmx2Filter);
	SWS_RELEASE(c->lumMmx2FilterPos);
	SWS_RELEASE(c->chrMmx2FilterPos);
	SWS_RELEASE(c->yuvTable);

#undef SWS_RELEASE

	free(c);
}

2707

Older »