mirror of
https://github.com/mpv-player/mpv
synced 2024-12-27 09:32:40 +00:00
9a210ca2d5
Something like "char *s = ...; isdigit(s[0]);" triggers undefined behavior, because char can be signed, and thus s[0] can be a negative value. The is*() functions require unsigned char _or_ EOF. EOF is a special value outside of unsigned char range, thus the argument to the is*() functions can't be a char. This undefined behavior can actually trigger crashes if the implementation of these functions e.g. uses lookup tables, which are then indexed with out-of-range values. Replace all <ctype.h> uses with our own custom mp_is*() functions added with misc/ctype.h. As a bonus, these functions are locale-independent. (Although currently, we _require_ C locale for other reasons.)
2223 lines
78 KiB
C
2223 lines
78 KiB
C
/*
|
|
* This file is part of MPlayer.
|
|
*
|
|
* Original author: Reimar Doeffinger <Reimar.Doeffinger@gmx.de>
|
|
*
|
|
* MPlayer is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* MPlayer is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with MPlayer; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*
|
|
* You can alternatively redistribute this file and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <math.h>
|
|
#include <stdbool.h>
|
|
#include <assert.h>
|
|
|
|
#include "config.h"
|
|
#include "talloc.h"
|
|
#include "common/msg.h"
|
|
#include "misc/ctype.h"
|
|
#include "options/m_option.h"
|
|
#include "vo.h"
|
|
#include "video/vfcap.h"
|
|
#include "video/mp_image.h"
|
|
#include "sub/osd.h"
|
|
|
|
#include "gl_common.h"
|
|
#include "gl_osd.h"
|
|
#include "video/memcpy_pic.h"
|
|
#include "pnm_loader.h"
|
|
|
|
//for gl_priv.use_yuv
|
|
#define MASK_ALL_YUV (~(1 << YUV_CONVERSION_NONE))
|
|
#define MASK_NOT_COMBINERS (~((1 << YUV_CONVERSION_NONE) | (1 << YUV_CONVERSION_COMBINERS)))
|
|
#define MASK_GAMMA_SUPPORT (MASK_NOT_COMBINERS & ~(1 << YUV_CONVERSION_FRAGMENT))
|
|
|
|
struct gl_priv {
|
|
MPGLContext *glctx;
|
|
GL *gl;
|
|
|
|
int allow_sw;
|
|
|
|
int scaled_osd;
|
|
struct mpgl_osd *osd;
|
|
int osd_color;
|
|
double osd_pts;
|
|
|
|
int use_ycbcr;
|
|
int use_yuv;
|
|
int is_yuv;
|
|
int lscale;
|
|
int cscale;
|
|
float filter_strength;
|
|
float noise_strength;
|
|
int yuvconvtype;
|
|
int use_rectangle;
|
|
int err_shown;
|
|
uint32_t image_width;
|
|
uint32_t image_height;
|
|
uint32_t image_format;
|
|
int many_fmts;
|
|
int have_texture_rg;
|
|
int max_tex_component_size;
|
|
int ati_hack;
|
|
int force_pbo;
|
|
int use_glFinish;
|
|
int swap_interval;
|
|
GLenum target;
|
|
GLint texfmt;
|
|
GLenum gl_format;
|
|
GLenum gl_type;
|
|
GLuint buffer;
|
|
GLuint buffer_uv[2];
|
|
int buffersize;
|
|
int buffersize_uv;
|
|
void *bufferptr;
|
|
void *bufferptr_uv[2];
|
|
GLuint fragprog;
|
|
GLuint default_texs[22];
|
|
char *custom_prog;
|
|
char *custom_tex;
|
|
int custom_tlin;
|
|
int custom_trect;
|
|
int mipmap_gen;
|
|
int stereo_mode;
|
|
char *backend_arg;
|
|
|
|
struct mp_csp_equalizer video_eq;
|
|
|
|
int texture_width;
|
|
int texture_height;
|
|
int mpi_flipped;
|
|
int vo_flipped;
|
|
|
|
struct mp_rect src_rect; // displayed part of the source video
|
|
struct mp_rect dst_rect; // video rectangle on output window
|
|
struct mp_osd_res osd_res;
|
|
|
|
int slice_height;
|
|
};
|
|
|
|
static int glFindFormat(uint32_t format, int have_texture_rg, int *bpp,
|
|
GLint *gl_texfmt, GLenum *gl_format, GLenum *gl_type);
|
|
static void glCreateClearTex(GL *gl, GLenum target, GLenum fmt, GLenum format,
|
|
GLenum type, GLint filter, int w, int h,
|
|
unsigned char val);
|
|
static int glCreatePPMTex(GL *gl, GLenum target, GLenum fmt, GLint filter,
|
|
FILE *f, int *width, int *height, int *maxval);
|
|
static void glDrawTex(GL *gl, GLfloat x, GLfloat y, GLfloat w, GLfloat h,
|
|
GLfloat tx, GLfloat ty, GLfloat tw, GLfloat th,
|
|
int sx, int sy, int rect_tex, int is_yv12, int flip);
|
|
static int loadGPUProgram(struct vo *vo, GL *gl, GLenum target, char *prog);
|
|
//! do not use YUV conversion, this should always stay 0
|
|
#define YUV_CONVERSION_NONE 0
|
|
//! use nVidia specific register combiners for YUV conversion
|
|
//! implementation has been removed
|
|
#define YUV_CONVERSION_COMBINERS 1
|
|
//! use a fragment program for YUV conversion
|
|
#define YUV_CONVERSION_FRAGMENT 2
|
|
//! use a fragment program for YUV conversion with gamma using POW
|
|
#define YUV_CONVERSION_FRAGMENT_POW 3
|
|
//! use a fragment program with additional table lookup for YUV conversion
|
|
#define YUV_CONVERSION_FRAGMENT_LOOKUP 4
|
|
//! use ATI specific register combiners ("fragment program")
|
|
#define YUV_CONVERSION_COMBINERS_ATI 5
|
|
//! use a fragment program with 3D table lookup for YUV conversion
|
|
#define YUV_CONVERSION_FRAGMENT_LOOKUP3D 6
|
|
//! use ATI specific "text" register combiners ("fragment program")
|
|
#define YUV_CONVERSION_TEXT_FRAGMENT 7
|
|
//! use normal bilinear scaling for textures
|
|
#define YUV_SCALER_BILIN 0
|
|
//! use higher quality bicubic scaling for textures
|
|
#define YUV_SCALER_BICUB 1
|
|
//! use cubic scaling in X and normal linear scaling in Y direction
|
|
#define YUV_SCALER_BICUB_X 2
|
|
//! use cubic scaling without additional lookup texture
|
|
#define YUV_SCALER_BICUB_NOTEX 3
|
|
#define YUV_SCALER_UNSHARP 4
|
|
#define YUV_SCALER_UNSHARP2 5
|
|
//! mask for conversion type
|
|
#define YUV_CONVERSION_MASK 0xF
|
|
//! mask for scaler type
|
|
#define YUV_SCALER_MASK 0xF
|
|
//! shift value for luminance scaler type
|
|
#define YUV_LUM_SCALER_SHIFT 8
|
|
//! shift value for chrominance scaler type
|
|
#define YUV_CHROM_SCALER_SHIFT 12
|
|
//! extract conversion out of type
|
|
#define YUV_CONVERSION(t) ((t) & YUV_CONVERSION_MASK)
|
|
//! extract luminance scaler out of type
|
|
#define YUV_LUM_SCALER(t) (((t) >> YUV_LUM_SCALER_SHIFT) & YUV_SCALER_MASK)
|
|
//! extract chrominance scaler out of type
|
|
#define YUV_CHROM_SCALER(t) (((t) >> YUV_CHROM_SCALER_SHIFT) & YUV_SCALER_MASK)
|
|
#define SET_YUV_CONVERSION(c) ((c) & YUV_CONVERSION_MASK)
|
|
#define SET_YUV_LUM_SCALER(s) (((s) & YUV_SCALER_MASK) << YUV_LUM_SCALER_SHIFT)
|
|
#define SET_YUV_CHROM_SCALER(s) (((s) & YUV_SCALER_MASK) << YUV_CHROM_SCALER_SHIFT)
|
|
//! returns whether the yuv conversion supports large brightness range etc.
|
|
static inline int glYUVLargeRange(int conv)
|
|
{
|
|
switch (conv) {
|
|
case YUV_CONVERSION_NONE:
|
|
case YUV_CONVERSION_COMBINERS_ATI:
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
case YUV_CONVERSION_TEXT_FRAGMENT:
|
|
return 0;
|
|
}
|
|
return 1;
|
|
}
|
|
typedef struct {
|
|
GLenum target;
|
|
int type;
|
|
struct mp_csp_params csp_params;
|
|
int texw;
|
|
int texh;
|
|
int chrom_texw;
|
|
int chrom_texh;
|
|
float filter_strength;
|
|
float noise_strength;
|
|
} gl_conversion_params_t;
|
|
|
|
static int glAutodetectYUVConversion(GL *gl);
|
|
static void glSetupYUVConversion(struct vo *vo, GL *gl,
|
|
gl_conversion_params_t *params);
|
|
static void glEnableYUVConversion(GL *gl, GLenum target, int type);
|
|
static void glDisableYUVConversion(GL *gl, GLenum target, int type);
|
|
|
|
//! always return this format as internal texture format in glFindFormat
|
|
#define TEXTUREFORMAT_ALWAYS GL_RGB8
|
|
#undef TEXTUREFORMAT_ALWAYS
|
|
|
|
/**
|
|
* \brief find the OpenGL settings coresponding to format.
|
|
*
|
|
* All parameters may be NULL.
|
|
* \param fmt MPlayer format to analyze.
|
|
* \param dummy reserved
|
|
* \param gl_texfmt [OUT] internal texture format that fits the
|
|
* image format, not necessarily the best for performance.
|
|
* \param gl_format [OUT] OpenGL format for this image format.
|
|
* \param gl_type [OUT] OpenGL type for this image format.
|
|
* \return 1 if format is supported by OpenGL, 0 if not.
|
|
* \ingroup gltexture
|
|
*/
|
|
static int glFindFormat(uint32_t fmt, int have_texture_rg, int *dummy,
|
|
GLint *gl_texfmt, GLenum *gl_format, GLenum *gl_type)
|
|
{
|
|
int supported = 1;
|
|
GLenum dummy2;
|
|
GLint dummy3;
|
|
if (!gl_texfmt)
|
|
gl_texfmt = &dummy3;
|
|
if (!gl_format)
|
|
gl_format = &dummy2;
|
|
if (!gl_type)
|
|
gl_type = &dummy2;
|
|
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(fmt);
|
|
if (desc.flags & MP_IMGFLAG_YUV_P) {
|
|
// reduce the possible cases a bit
|
|
if (desc.plane_bits > 8)
|
|
fmt = IMGFMT_420P16;
|
|
else
|
|
fmt = IMGFMT_420P;
|
|
}
|
|
|
|
*gl_texfmt = 3;
|
|
switch (fmt) {
|
|
case IMGFMT_RGB48:
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_SHORT;
|
|
break;
|
|
case IMGFMT_RGB24:
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
break;
|
|
case IMGFMT_RGBA:
|
|
*gl_texfmt = 4;
|
|
*gl_format = GL_RGBA;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
break;
|
|
case IMGFMT_420P16:
|
|
supported = 0; // no native YUV support
|
|
*gl_texfmt = have_texture_rg ? GL_R16 : GL_LUMINANCE16;
|
|
*gl_format = have_texture_rg ? GL_RED : GL_LUMINANCE;
|
|
*gl_type = GL_UNSIGNED_SHORT;
|
|
break;
|
|
case IMGFMT_420P:
|
|
supported = 0; // no native YV12 support
|
|
case IMGFMT_Y8:
|
|
*gl_texfmt = 1;
|
|
*gl_format = GL_LUMINANCE;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
break;
|
|
case IMGFMT_UYVY:
|
|
*gl_texfmt = GL_YCBCR_MESA;
|
|
*gl_format = GL_YCBCR_MESA;
|
|
*gl_type = fmt == IMGFMT_UYVY ? GL_UNSIGNED_SHORT_8_8 : GL_UNSIGNED_SHORT_8_8_REV;
|
|
break;
|
|
#if 0
|
|
// we do not support palettized formats, although the format the
|
|
// swscale produces works
|
|
case IMGFMT_RGB8:
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_BYTE_2_3_3_REV;
|
|
break;
|
|
#endif
|
|
case IMGFMT_BGR555:
|
|
*gl_format = GL_RGBA;
|
|
*gl_type = GL_UNSIGNED_SHORT_1_5_5_5_REV;
|
|
break;
|
|
case IMGFMT_BGR565:
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_SHORT_5_6_5_REV;
|
|
break;
|
|
#if 0
|
|
case IMGFMT_BGR8:
|
|
// special case as red and blue have a different number of bits.
|
|
// GL_BGR and GL_UNSIGNED_BYTE_3_3_2 isn't supported at least
|
|
// by nVidia drivers, and in addition would give more bits to
|
|
// blue than to red, which isn't wanted
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_BYTE_3_3_2;
|
|
break;
|
|
#endif
|
|
case IMGFMT_RGB555:
|
|
*gl_format = GL_BGRA;
|
|
*gl_type = GL_UNSIGNED_SHORT_1_5_5_5_REV;
|
|
break;
|
|
case IMGFMT_RGB565:
|
|
*gl_format = GL_RGB;
|
|
*gl_type = GL_UNSIGNED_SHORT_5_6_5;
|
|
break;
|
|
case IMGFMT_BGR24:
|
|
*gl_format = GL_BGR;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
break;
|
|
case IMGFMT_BGRA:
|
|
*gl_texfmt = 4;
|
|
*gl_format = GL_BGRA;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
break;
|
|
default:
|
|
*gl_texfmt = 4;
|
|
*gl_format = GL_RGBA;
|
|
*gl_type = GL_UNSIGNED_BYTE;
|
|
supported = 0;
|
|
}
|
|
#ifdef TEXTUREFORMAT_ALWAYS
|
|
*gl_texfmt = TEXTUREFORMAT_ALWAYS;
|
|
#endif
|
|
return supported;
|
|
}
|
|
|
|
/**
|
|
* \brief create a texture and set some defaults
|
|
* \param target texture taget, usually GL_TEXTURE_2D
|
|
* \param fmt internal texture format
|
|
* \param format texture host data format
|
|
* \param type texture host data type
|
|
* \param filter filter used for scaling, e.g. GL_LINEAR
|
|
* \param w texture width
|
|
* \param h texture height
|
|
* \param val luminance value to fill texture with
|
|
* \ingroup gltexture
|
|
*/
|
|
static void glCreateClearTex(GL *gl, GLenum target, GLenum fmt, GLenum format,
|
|
GLenum type, GLint filter, int w, int h,
|
|
unsigned char val)
|
|
{
|
|
GLfloat fval = (GLfloat)val / 255.0;
|
|
GLfloat border[4] = {
|
|
fval, fval, fval, fval
|
|
};
|
|
int stride;
|
|
char *init;
|
|
if (w == 0)
|
|
w = 1;
|
|
if (h == 0)
|
|
h = 1;
|
|
stride = w * glFmt2bpp(format, type);
|
|
if (!stride)
|
|
return;
|
|
init = malloc(stride * h);
|
|
memset(init, val, stride * h);
|
|
glAdjustAlignment(gl, stride);
|
|
gl->PixelStorei(GL_UNPACK_ROW_LENGTH, w);
|
|
gl->TexImage2D(target, 0, fmt, w, h, 0, format, type, init);
|
|
gl->TexParameterf(target, GL_TEXTURE_PRIORITY, 1.0);
|
|
gl->TexParameteri(target, GL_TEXTURE_MIN_FILTER, filter);
|
|
gl->TexParameteri(target, GL_TEXTURE_MAG_FILTER, filter);
|
|
gl->TexParameteri(target, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
|
|
gl->TexParameteri(target, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE);
|
|
// Border texels should not be used with CLAMP_TO_EDGE
|
|
// We set a sane default anyway.
|
|
gl->TexParameterfv(target, GL_TEXTURE_BORDER_COLOR, border);
|
|
free(init);
|
|
}
|
|
|
|
static GLint detect_hqtexfmt(GL *gl)
|
|
{
|
|
const char *extensions = (const char *)gl->GetString(GL_EXTENSIONS);
|
|
if (strstr(extensions, "_texture_float"))
|
|
return GL_RGB32F;
|
|
else if (strstr(extensions, "NV_float_buffer"))
|
|
return GL_FLOAT_RGB32_NV;
|
|
return GL_RGB16;
|
|
}
|
|
|
|
/**
|
|
* \brief creates a texture from a PPM file
|
|
* \param target texture taget, usually GL_TEXTURE_2D
|
|
* \param fmt internal texture format, 0 for default
|
|
* \param filter filter used for scaling, e.g. GL_LINEAR
|
|
* \param f file to read PPM from
|
|
* \param width [out] width of texture
|
|
* \param height [out] height of texture
|
|
* \param maxval [out] maxval value from PPM file
|
|
* \return 0 on error, 1 otherwise
|
|
* \ingroup gltexture
|
|
*/
|
|
static int glCreatePPMTex(GL *gl, GLenum target, GLenum fmt, GLint filter,
|
|
FILE *f, int *width, int *height, int *maxval)
|
|
{
|
|
int w, h, m, bpp;
|
|
GLenum type;
|
|
uint8_t *data = read_pnm(f, &w, &h, &bpp, &m);
|
|
GLint hqtexfmt = detect_hqtexfmt(gl);
|
|
if (!data || (bpp != 3 && bpp != 6)) {
|
|
free(data);
|
|
return 0;
|
|
}
|
|
if (!fmt) {
|
|
fmt = bpp == 6 ? hqtexfmt : 3;
|
|
if (fmt == GL_FLOAT_RGB32_NV && target != GL_TEXTURE_RECTANGLE)
|
|
fmt = GL_RGB16;
|
|
}
|
|
type = bpp == 6 ? GL_UNSIGNED_SHORT : GL_UNSIGNED_BYTE;
|
|
glCreateClearTex(gl, target, fmt, GL_RGB, type, filter, w, h, 0);
|
|
glUploadTex(gl, target, GL_RGB, type,
|
|
data, w * bpp, 0, 0, w, h, 0);
|
|
free(data);
|
|
if (width)
|
|
*width = w;
|
|
if (height)
|
|
*height = h;
|
|
if (maxval)
|
|
*maxval = m;
|
|
return 1;
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief Setup ATI version of register combiners for YUV to RGB conversion.
|
|
* \param csp_params parameters used for colorspace conversion
|
|
* \param text if set use the GL_ATI_text_fragment_shader API as
|
|
* used on OS X.
|
|
*/
|
|
static void glSetupYUVFragmentATI(struct vo *vo, GL *gl,
|
|
struct mp_csp_params *csp_params, int text)
|
|
{
|
|
GLint i;
|
|
float yuv2rgb[3][4];
|
|
|
|
gl->GetIntegerv(GL_MAX_TEXTURE_UNITS, &i);
|
|
if (i < 3)
|
|
MP_ERR(vo, "3 texture units needed for YUV combiner (ATI) support (found %i)\n", i);
|
|
|
|
mp_get_yuv2rgb_coeffs(csp_params, yuv2rgb);
|
|
for (i = 0; i < 3; i++) {
|
|
int j;
|
|
yuv2rgb[i][3] -= -0.5 * (yuv2rgb[i][1] + yuv2rgb[i][2]);
|
|
for (j = 0; j < 4; j++) {
|
|
yuv2rgb[i][j] *= 0.125;
|
|
yuv2rgb[i][j] += 0.5;
|
|
if (yuv2rgb[i][j] > 1)
|
|
yuv2rgb[i][j] = 1;
|
|
if (yuv2rgb[i][j] < 0)
|
|
yuv2rgb[i][j] = 0;
|
|
}
|
|
}
|
|
if (text == 0) {
|
|
GLfloat c0[4] = { yuv2rgb[0][0], yuv2rgb[1][0], yuv2rgb[2][0] };
|
|
GLfloat c1[4] = { yuv2rgb[0][1], yuv2rgb[1][1], yuv2rgb[2][1] };
|
|
GLfloat c2[4] = { yuv2rgb[0][2], yuv2rgb[1][2], yuv2rgb[2][2] };
|
|
GLfloat c3[4] = { yuv2rgb[0][3], yuv2rgb[1][3], yuv2rgb[2][3] };
|
|
if (!gl->BeginFragmentShader || !gl->EndFragmentShader ||
|
|
!gl->SetFragmentShaderConstant || !gl->SampleMap ||
|
|
!gl->ColorFragmentOp2 || !gl->ColorFragmentOp3) {
|
|
MP_ERR(vo, "Combiner (ATI) functions missing!\n");
|
|
return;
|
|
}
|
|
gl->GetIntegerv(GL_NUM_FRAGMENT_REGISTERS_ATI, &i);
|
|
if (i < 3)
|
|
MP_ERR(vo, "3 registers needed for YUV combiner (ATI) support (found %i)\n", i);
|
|
gl->BeginFragmentShader();
|
|
gl->SetFragmentShaderConstant(GL_CON_0_ATI, c0);
|
|
gl->SetFragmentShaderConstant(GL_CON_1_ATI, c1);
|
|
gl->SetFragmentShaderConstant(GL_CON_2_ATI, c2);
|
|
gl->SetFragmentShaderConstant(GL_CON_3_ATI, c3);
|
|
gl->SampleMap(GL_REG_0_ATI, GL_TEXTURE0, GL_SWIZZLE_STR_ATI);
|
|
gl->SampleMap(GL_REG_1_ATI, GL_TEXTURE1, GL_SWIZZLE_STR_ATI);
|
|
gl->SampleMap(GL_REG_2_ATI, GL_TEXTURE2, GL_SWIZZLE_STR_ATI);
|
|
gl->ColorFragmentOp2(GL_MUL_ATI, GL_REG_1_ATI, GL_NONE, GL_NONE,
|
|
GL_REG_1_ATI, GL_NONE, GL_BIAS_BIT_ATI,
|
|
GL_CON_1_ATI, GL_NONE, GL_BIAS_BIT_ATI);
|
|
gl->ColorFragmentOp3(GL_MAD_ATI, GL_REG_2_ATI, GL_NONE, GL_NONE,
|
|
GL_REG_2_ATI, GL_NONE, GL_BIAS_BIT_ATI,
|
|
GL_CON_2_ATI, GL_NONE, GL_BIAS_BIT_ATI,
|
|
GL_REG_1_ATI, GL_NONE, GL_NONE);
|
|
gl->ColorFragmentOp3(GL_MAD_ATI, GL_REG_0_ATI, GL_NONE, GL_NONE,
|
|
GL_REG_0_ATI, GL_NONE, GL_NONE,
|
|
GL_CON_0_ATI, GL_NONE, GL_BIAS_BIT_ATI,
|
|
GL_REG_2_ATI, GL_NONE, GL_NONE);
|
|
gl->ColorFragmentOp2(GL_ADD_ATI, GL_REG_0_ATI, GL_NONE, GL_8X_BIT_ATI,
|
|
GL_REG_0_ATI, GL_NONE, GL_NONE,
|
|
GL_CON_3_ATI, GL_NONE, GL_BIAS_BIT_ATI);
|
|
gl->EndFragmentShader();
|
|
} else {
|
|
static const char template[] =
|
|
"!!ATIfs1.0\n"
|
|
"StartConstants;\n"
|
|
" CONSTANT c0 = {%e, %e, %e};\n"
|
|
" CONSTANT c1 = {%e, %e, %e};\n"
|
|
" CONSTANT c2 = {%e, %e, %e};\n"
|
|
" CONSTANT c3 = {%e, %e, %e};\n"
|
|
"EndConstants;\n"
|
|
"StartOutputPass;\n"
|
|
" SampleMap r0, t0.str;\n"
|
|
" SampleMap r1, t1.str;\n"
|
|
" SampleMap r2, t2.str;\n"
|
|
" MUL r1.rgb, r1.bias, c1.bias;\n"
|
|
" MAD r2.rgb, r2.bias, c2.bias, r1;\n"
|
|
" MAD r0.rgb, r0, c0.bias, r2;\n"
|
|
" ADD r0.rgb.8x, r0, c3.bias;\n"
|
|
"EndPass;\n";
|
|
char buffer[512];
|
|
snprintf(buffer, sizeof(buffer), template,
|
|
yuv2rgb[0][0], yuv2rgb[1][0], yuv2rgb[2][0],
|
|
yuv2rgb[0][1], yuv2rgb[1][1], yuv2rgb[2][1],
|
|
yuv2rgb[0][2], yuv2rgb[1][2], yuv2rgb[2][2],
|
|
yuv2rgb[0][3], yuv2rgb[1][3], yuv2rgb[2][3]);
|
|
MP_DBG(vo, "generated fragment program:\n%s\n", buffer);
|
|
loadGPUProgram(vo, gl, GL_TEXT_FRAGMENT_SHADER_ATI, buffer);
|
|
}
|
|
}
|
|
|
|
// Replace all occurances of variables named "$"+name (e.g. $foo) in *text with
|
|
// replace, and return the result. *text must have been allocated with talloc.
|
|
static void replace_var_str(char **text, const char *name, const char *replace)
|
|
{
|
|
size_t namelen = strlen(name);
|
|
char *nextvar = *text;
|
|
void *parent = talloc_parent(*text);
|
|
for (;;) {
|
|
nextvar = strchr(nextvar, '$');
|
|
if (!nextvar)
|
|
break;
|
|
char *until = nextvar;
|
|
nextvar++;
|
|
if (strncmp(nextvar, name, namelen) != 0)
|
|
continue;
|
|
nextvar += namelen;
|
|
// try not to replace prefixes of other vars (e.g. $foo vs. $foo_bar)
|
|
char term = nextvar[0];
|
|
if (mp_isalnum(term) || term == '_')
|
|
continue;
|
|
int prelength = until - *text;
|
|
int postlength = nextvar - *text;
|
|
char *n = talloc_asprintf(parent, "%.*s%s%s", prelength, *text, replace,
|
|
nextvar);
|
|
talloc_free(*text);
|
|
*text = n;
|
|
nextvar = *text + postlength;
|
|
}
|
|
}
|
|
|
|
static void replace_var_float(char **text, const char *name, float replace)
|
|
{
|
|
char *s = talloc_asprintf(NULL, "%e", replace);
|
|
replace_var_str(text, name, s);
|
|
talloc_free(s);
|
|
}
|
|
|
|
static void replace_var_char(char **text, const char *name, char replace)
|
|
{
|
|
char s[2] = { replace, '\0' };
|
|
replace_var_str(text, name, s);
|
|
}
|
|
|
|
// Append template to *text. Possibly initialize *text if it's NULL.
|
|
static void append_template(char **text, const char* template)
|
|
{
|
|
if (!*text)
|
|
*text = talloc_strdup(NULL, template);
|
|
else
|
|
*text = talloc_strdup_append(*text, template);
|
|
}
|
|
|
|
/**
|
|
* \brief helper function for gen_spline_lookup_tex
|
|
* \param x subpixel-position ((0,1) range) to calculate weights for
|
|
* \param dst where to store transformed weights, must provide space for 4 GLfloats
|
|
*
|
|
* calculates the weights and stores them after appropriate transformation
|
|
* for the scaler fragment program.
|
|
*/
|
|
static void store_weights(float x, GLfloat *dst)
|
|
{
|
|
float w0 = (((-1 * x + 3) * x - 3) * x + 1) / 6;
|
|
float w1 = (((3 * x - 6) * x + 0) * x + 4) / 6;
|
|
float w2 = (((-3 * x + 3) * x + 3) * x + 1) / 6;
|
|
float w3 = (((1 * x + 0) * x + 0) * x + 0) / 6;
|
|
*dst++ = 1 + x - w1 / (w0 + w1);
|
|
*dst++ = 1 - x + w3 / (w2 + w3);
|
|
*dst++ = w0 + w1;
|
|
*dst++ = 0;
|
|
}
|
|
|
|
//! to avoid artefacts this should be rather large
|
|
#define LOOKUP_BSPLINE_RES (2 * 1024)
|
|
/**
|
|
* \brief creates the 1D lookup texture needed for fast higher-order filtering
|
|
* \param unit texture unit to attach texture to
|
|
*/
|
|
static void gen_spline_lookup_tex(GL *gl, GLenum unit)
|
|
{
|
|
GLfloat *tex = calloc(4 * LOOKUP_BSPLINE_RES, sizeof(*tex));
|
|
GLfloat *tp = tex;
|
|
int i;
|
|
for (i = 0; i < LOOKUP_BSPLINE_RES; i++) {
|
|
float x = (float)(i + 0.5) / LOOKUP_BSPLINE_RES;
|
|
store_weights(x, tp);
|
|
tp += 4;
|
|
}
|
|
store_weights(0, tex);
|
|
store_weights(1, &tex[4 * (LOOKUP_BSPLINE_RES - 1)]);
|
|
gl->ActiveTexture(unit);
|
|
gl->TexImage1D(GL_TEXTURE_1D, 0, GL_RGBA16, LOOKUP_BSPLINE_RES, 0, GL_RGBA,
|
|
GL_FLOAT, tex);
|
|
gl->TexParameterf(GL_TEXTURE_1D, GL_TEXTURE_PRIORITY, 1.0);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_MIN_FILTER, GL_NEAREST);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_MAG_FILTER, GL_NEAREST);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_WRAP_S, GL_REPEAT);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
free(tex);
|
|
}
|
|
|
|
#define NOISE_RES 2048
|
|
|
|
/**
|
|
* \brief creates the 1D lookup texture needed to generate pseudo-random numbers.
|
|
* \param unit texture unit to attach texture to
|
|
*/
|
|
static void gen_noise_lookup_tex(GL *gl, GLenum unit) {
|
|
GLfloat *tex = calloc(NOISE_RES, sizeof(*tex));
|
|
uint32_t lcg = 0x79381c11;
|
|
int i;
|
|
for (i = 0; i < NOISE_RES; i++)
|
|
tex[i] = (double)i / (NOISE_RES - 1);
|
|
for (i = 0; i < NOISE_RES - 1; i++) {
|
|
int remain = NOISE_RES - i;
|
|
int idx = i + (lcg >> 16) % remain;
|
|
GLfloat tmp = tex[i];
|
|
tex[i] = tex[idx];
|
|
tex[idx] = tmp;
|
|
lcg = lcg * 1664525 + 1013904223;
|
|
}
|
|
gl->ActiveTexture(unit);
|
|
gl->TexImage1D(GL_TEXTURE_1D, 0, 1, NOISE_RES, 0, GL_RED, GL_FLOAT, tex);
|
|
gl->TexParameterf(GL_TEXTURE_1D, GL_TEXTURE_PRIORITY, 1.0);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_MIN_FILTER, GL_NEAREST);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_MAG_FILTER, GL_NEAREST);
|
|
gl->TexParameteri(GL_TEXTURE_1D, GL_TEXTURE_WRAP_S, GL_REPEAT);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
free(tex);
|
|
}
|
|
|
|
#define SAMPLE(dest, coord, texture) \
|
|
"TEX textemp, " coord ", " texture ", $tex_type;\n" \
|
|
"MOV " dest ", textemp.r;\n"
|
|
|
|
static const char bilin_filt_template[] =
|
|
SAMPLE("yuv.$out_comp","fragment.texcoord[$in_tex]","texture[$in_tex]");
|
|
|
|
#define BICUB_FILT_MAIN \
|
|
/* first y-interpolation */ \
|
|
"ADD coord, fragment.texcoord[$in_tex].xyxy, cdelta.xyxw;\n" \
|
|
"ADD coord2, fragment.texcoord[$in_tex].xyxy, cdelta.zyzw;\n" \
|
|
SAMPLE("a.r","coord.xyxy","texture[$in_tex]") \
|
|
SAMPLE("a.g","coord.zwzw","texture[$in_tex]") \
|
|
/* second y-interpolation */ \
|
|
SAMPLE("b.r","coord2.xyxy","texture[$in_tex]") \
|
|
SAMPLE("b.g","coord2.zwzw","texture[$in_tex]") \
|
|
"LRP a.b, parmy.b, a.rrrr, a.gggg;\n" \
|
|
"LRP a.a, parmy.b, b.rrrr, b.gggg;\n" \
|
|
/* x-interpolation */ \
|
|
"LRP yuv.$out_comp, parmx.b, a.bbbb, a.aaaa;\n"
|
|
|
|
static const char bicub_filt_template_2D[] =
|
|
"MAD coord.xy, fragment.texcoord[$in_tex], {$texw, $texh}, {0.5, 0.5};\n"
|
|
"TEX parmx, coord.x, texture[$texs], 1D;\n"
|
|
"MUL cdelta.xz, parmx.rrgg, {-$ptw, 0, $ptw, 0};\n"
|
|
"TEX parmy, coord.y, texture[$texs], 1D;\n"
|
|
"MUL cdelta.yw, parmy.rrgg, {0, -$pth, 0, $pth};\n"
|
|
BICUB_FILT_MAIN;
|
|
|
|
static const char bicub_filt_template_RECT[] =
|
|
"ADD coord, fragment.texcoord[$in_tex], {0.5, 0.5};\n"
|
|
"TEX parmx, coord.x, texture[$texs], 1D;\n"
|
|
"MUL cdelta.xz, parmx.rrgg, {-1, 0, 1, 0};\n"
|
|
"TEX parmy, coord.y, texture[$texs], 1D;\n"
|
|
"MUL cdelta.yw, parmy.rrgg, {0, -1, 0, 1};\n"
|
|
BICUB_FILT_MAIN;
|
|
|
|
#define CALCWEIGHTS(t, s) \
|
|
"MAD "t ", {-0.5, 0.1666, 0.3333, -0.3333}, "s ", {1, 0, -0.5, 0.5};\n" \
|
|
"MAD "t ", "t ", "s ", {0, 0, -0.5, 0.5};\n" \
|
|
"MAD "t ", "t ", "s ", {-0.6666, 0, 0.8333, 0.1666};\n" \
|
|
"RCP a.x, "t ".z;\n" \
|
|
"RCP a.y, "t ".w;\n" \
|
|
"MAD "t ".xy, "t ".xyxy, a.xyxy, {1, 1, 0, 0};\n" \
|
|
"ADD "t ".x, "t ".xxxx, "s ";\n" \
|
|
"SUB "t ".y, "t ".yyyy, "s ";\n"
|
|
|
|
static const char bicub_notex_filt_template_2D[] =
|
|
"MAD coord.xy, fragment.texcoord[$in_tex], {$texw, $texh}, {0.5, 0.5};\n"
|
|
"FRC coord.xy, coord.xyxy;\n"
|
|
CALCWEIGHTS("parmx", "coord.xxxx")
|
|
"MUL cdelta.xz, parmx.rrgg, {-$ptw, 0, $ptw, 0};\n"
|
|
CALCWEIGHTS("parmy", "coord.yyyy")
|
|
"MUL cdelta.yw, parmy.rrgg, {0, -$pth, 0, $pth};\n"
|
|
BICUB_FILT_MAIN;
|
|
|
|
static const char bicub_notex_filt_template_RECT[] =
|
|
"ADD coord, fragment.texcoord[$in_tex], {0.5, 0.5};\n"
|
|
"FRC coord.xy, coord.xyxy;\n"
|
|
CALCWEIGHTS("parmx", "coord.xxxx")
|
|
"MUL cdelta.xz, parmx.rrgg, {-1, 0, 1, 0};\n"
|
|
CALCWEIGHTS("parmy", "coord.yyyy")
|
|
"MUL cdelta.yw, parmy.rrgg, {0, -1, 0, 1};\n"
|
|
BICUB_FILT_MAIN;
|
|
|
|
#define BICUB_X_FILT_MAIN \
|
|
"ADD coord.xy, fragment.texcoord[$in_tex].xyxy, cdelta.xyxy;\n" \
|
|
"ADD coord2.xy, fragment.texcoord[$in_tex].xyxy, cdelta.zyzy;\n" \
|
|
SAMPLE("a.r","coord","texture[$in_tex]") \
|
|
SAMPLE("b.r","coord2","texture[$in_tex]") \
|
|
/* x-interpolation */ \
|
|
"LRP yuv.$out_comp, parmx.b, a.rrrr, b.rrrr;\n"
|
|
|
|
static const char bicub_x_filt_template_2D[] =
|
|
"MAD coord.x, fragment.texcoord[$in_tex], {$texw}, {0.5};\n"
|
|
"TEX parmx, coord, texture[$texs], 1D;\n"
|
|
"MUL cdelta.xyz, parmx.rrgg, {-$ptw, 0, $ptw};\n"
|
|
BICUB_X_FILT_MAIN;
|
|
|
|
static const char bicub_x_filt_template_RECT[] =
|
|
"ADD coord.x, fragment.texcoord[$in_tex], {0.5};\n"
|
|
"TEX parmx, coord, texture[$texs], 1D;\n"
|
|
"MUL cdelta.xyz, parmx.rrgg, {-1, 0, 1};\n"
|
|
BICUB_X_FILT_MAIN;
|
|
|
|
static const char unsharp_filt_template[] =
|
|
"PARAM dcoord$out_comp = {$ptw_05, $pth_05, $ptw_05, -$pth_05};\n"
|
|
"ADD coord, fragment.texcoord[$in_tex].xyxy, dcoord$out_comp;\n"
|
|
"SUB coord2, fragment.texcoord[$in_tex].xyxy, dcoord$out_comp;\n"
|
|
SAMPLE("a.r","fragment.texcoord[$in_tex]","texture[$in_tex]")
|
|
SAMPLE("b.r","coord.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord.zwzw","texture[$in_tex]")
|
|
"ADD b.r, b.r, b.g;\n"
|
|
SAMPLE("b.b","coord2.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord2.zwzw","texture[$in_tex]")
|
|
"DP3 b, b, {0.25, 0.25, 0.25};\n"
|
|
"SUB b.r, a.r, b.r;\n"
|
|
"MAD textemp.r, b.r, {$strength}, a.r;\n"
|
|
"MOV yuv.$out_comp, textemp.r;\n";
|
|
|
|
static const char unsharp_filt_template2[] =
|
|
"PARAM dcoord$out_comp = {$ptw_12, $pth_12, $ptw_12, -$pth_12};\n"
|
|
"PARAM dcoord2$out_comp = {$ptw_15, 0, 0, $pth_15};\n"
|
|
"ADD coord, fragment.texcoord[$in_tex].xyxy, dcoord$out_comp;\n"
|
|
"SUB coord2, fragment.texcoord[$in_tex].xyxy, dcoord$out_comp;\n"
|
|
SAMPLE("a.r","fragment.texcoord[$in_tex]","texture[$in_tex]")
|
|
SAMPLE("b.r","coord.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord.zwzw","texture[$in_tex]")
|
|
"ADD b.r, b.r, b.g;\n"
|
|
SAMPLE("b.b","coord2.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord2.zwzw","texture[$in_tex]")
|
|
"ADD b.r, b.r, b.b;\n"
|
|
"ADD b.a, b.r, b.g;\n"
|
|
"ADD coord, fragment.texcoord[$in_tex].xyxy, dcoord2$out_comp;\n"
|
|
"SUB coord2, fragment.texcoord[$in_tex].xyxy, dcoord2$out_comp;\n"
|
|
SAMPLE("b.r","coord.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord.zwzw","texture[$in_tex]")
|
|
"ADD b.r, b.r, b.g;\n"
|
|
SAMPLE("b.b","coord2.xyxy","texture[$in_tex]")
|
|
SAMPLE("b.g","coord2.zwzw","texture[$in_tex]")
|
|
"DP4 b.r, b, {-0.1171875, -0.1171875, -0.1171875, -0.09765625};\n"
|
|
"MAD b.r, a.r, {0.859375}, b.r;\n"
|
|
"MAD textemp.r, b.r, {$strength}, a.r;\n"
|
|
"MOV yuv.$out_comp, textemp.r;\n";
|
|
|
|
static const char yuv_prog_template[] =
|
|
"PARAM ycoef = {$cm11, $cm21, $cm31};\n"
|
|
"PARAM ucoef = {$cm12, $cm22, $cm32};\n"
|
|
"PARAM vcoef = {$cm13, $cm23, $cm33};\n"
|
|
"PARAM offsets = {$cm14, $cm24, $cm34};\n"
|
|
"TEMP res;\n"
|
|
"MAD res.rgb, yuv.rrrr, ycoef, offsets;\n"
|
|
"MAD res.rgb, yuv.gggg, ucoef, res;\n"
|
|
"MAD res.rgb, yuv.bbbb, vcoef, res;\n";
|
|
|
|
static const char yuv_pow_prog_template[] =
|
|
"PARAM ycoef = {$cm11, $cm21, $cm31};\n"
|
|
"PARAM ucoef = {$cm12, $cm22, $cm32};\n"
|
|
"PARAM vcoef = {$cm13, $cm23, $cm33};\n"
|
|
"PARAM offsets = {$cm14, $cm24, $cm34};\n"
|
|
"PARAM gamma = {$gamma_r, $gamma_g, $gamma_b};\n"
|
|
"TEMP res;\n"
|
|
"MAD res.rgb, yuv.rrrr, ycoef, offsets;\n"
|
|
"MAD res.rgb, yuv.gggg, ucoef, res;\n"
|
|
"MAD_SAT res.rgb, yuv.bbbb, vcoef, res;\n"
|
|
"POW res.r, res.r, gamma.r;\n"
|
|
"POW res.g, res.g, gamma.g;\n"
|
|
"POW res.b, res.b, gamma.b;\n";
|
|
|
|
static const char yuv_lookup_prog_template[] =
|
|
"PARAM ycoef = {$cm11, $cm21, $cm31, 0};\n"
|
|
"PARAM ucoef = {$cm12, $cm22, $cm32, 0};\n"
|
|
"PARAM vcoef = {$cm13, $cm23, $cm33, 0};\n"
|
|
"PARAM offsets = {$cm14, $cm24, $cm34, 0.125};\n"
|
|
"TEMP res;\n"
|
|
"MAD res, yuv.rrrr, ycoef, offsets;\n"
|
|
"MAD res.rgb, yuv.gggg, ucoef, res;\n"
|
|
"MAD res.rgb, yuv.bbbb, vcoef, res;\n"
|
|
"TEX res.r, res.raaa, texture[$conv_tex0], 2D;\n"
|
|
"ADD res.a, res.a, 0.25;\n"
|
|
"TEX res.g, res.gaaa, texture[$conv_tex0], 2D;\n"
|
|
"ADD res.a, res.a, 0.25;\n"
|
|
"TEX res.b, res.baaa, texture[$conv_tex0], 2D;\n";
|
|
|
|
static const char yuv_lookup3d_prog_template[] =
|
|
"TEMP res;\n"
|
|
"TEX res, yuv, texture[$conv_tex0], 3D;\n";
|
|
|
|
static const char noise_filt_template[] =
|
|
"MUL coord.xy, fragment.texcoord[0], {$noise_sx, $noise_sy};\n"
|
|
"TEMP rand;\n"
|
|
"TEX rand.r, coord.x, texture[$noise_filt_tex], 1D;\n"
|
|
"ADD rand.r, rand.r, coord.y;\n"
|
|
"TEX rand.r, rand.r, texture[$noise_filt_tex], 1D;\n"
|
|
"MAD res.rgb, rand.rrrr, {$noise_str, $noise_str, $noise_str}, res;\n";
|
|
|
|
/**
|
|
* \brief creates and initializes helper textures needed for scaling texture read
|
|
* \param scaler scaler type to create texture for
|
|
* \param texu contains next free texture unit number
|
|
* \param texs texture unit ids for the scaler are stored in this array
|
|
*/
|
|
static void create_scaler_textures(struct vo *vo, GL *gl, int scaler, int *texu,
|
|
char *texs)
|
|
{
|
|
switch (scaler) {
|
|
case YUV_SCALER_BILIN:
|
|
case YUV_SCALER_BICUB_NOTEX:
|
|
case YUV_SCALER_UNSHARP:
|
|
case YUV_SCALER_UNSHARP2:
|
|
break;
|
|
case YUV_SCALER_BICUB:
|
|
case YUV_SCALER_BICUB_X:
|
|
texs[0] = (*texu)++;
|
|
gen_spline_lookup_tex(gl, GL_TEXTURE0 + texs[0]);
|
|
texs[0] += '0';
|
|
break;
|
|
default:
|
|
MP_ERR(vo, "unknown scaler type %i\n", scaler);
|
|
}
|
|
}
|
|
|
|
//! resolution of texture for gamma lookup table
|
|
#define LOOKUP_RES 512
|
|
//! resolution for 3D yuv->rgb conversion lookup table
|
|
#define LOOKUP_3DRES 32
|
|
/**
|
|
* \brief creates and initializes helper textures needed for yuv conversion
|
|
* \param params struct containing parameters like brightness, gamma, ...
|
|
* \param texu contains next free texture unit number
|
|
* \param texs texture unit ids for the conversion are stored in this array
|
|
*/
|
|
static void create_conv_textures(struct vo *vo, GL *gl,
|
|
gl_conversion_params_t *params,
|
|
int *texu, char *texs)
|
|
{
|
|
unsigned char *lookup_data = NULL;
|
|
int conv = YUV_CONVERSION(params->type);
|
|
switch (conv) {
|
|
case YUV_CONVERSION_FRAGMENT:
|
|
case YUV_CONVERSION_FRAGMENT_POW:
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP:
|
|
texs[0] = (*texu)++;
|
|
gl->ActiveTexture(GL_TEXTURE0 + texs[0]);
|
|
lookup_data = malloc(4 * LOOKUP_RES);
|
|
mp_gen_gamma_map(lookup_data, LOOKUP_RES, params->csp_params.rgamma);
|
|
mp_gen_gamma_map(&lookup_data[LOOKUP_RES], LOOKUP_RES,
|
|
params->csp_params.ggamma);
|
|
mp_gen_gamma_map(&lookup_data[2 * LOOKUP_RES], LOOKUP_RES,
|
|
params->csp_params.bgamma);
|
|
glCreateClearTex(gl, GL_TEXTURE_2D, GL_LUMINANCE8, GL_LUMINANCE,
|
|
GL_UNSIGNED_BYTE, GL_LINEAR, LOOKUP_RES, 4, 0);
|
|
glUploadTex(gl, GL_TEXTURE_2D, GL_LUMINANCE, GL_UNSIGNED_BYTE,
|
|
lookup_data, LOOKUP_RES, 0, 0, LOOKUP_RES, 4, 0);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
texs[0] += '0';
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
{
|
|
int sz = LOOKUP_3DRES + 2; // texture size including borders
|
|
if (!gl->TexImage3D) {
|
|
MP_ERR(vo, "Missing 3D texture function!\n");
|
|
break;
|
|
}
|
|
texs[0] = (*texu)++;
|
|
gl->ActiveTexture(GL_TEXTURE0 + texs[0]);
|
|
lookup_data = malloc(3 * sz * sz * sz);
|
|
mp_gen_yuv2rgb_map(¶ms->csp_params, lookup_data, LOOKUP_3DRES);
|
|
glAdjustAlignment(gl, sz);
|
|
gl->PixelStorei(GL_UNPACK_ROW_LENGTH, 0);
|
|
gl->TexImage3D(GL_TEXTURE_3D, 0, 3, sz, sz, sz, 1,
|
|
GL_RGB, GL_UNSIGNED_BYTE, lookup_data);
|
|
gl->TexParameterf(GL_TEXTURE_3D, GL_TEXTURE_PRIORITY, 1.0);
|
|
gl->TexParameteri(GL_TEXTURE_3D, GL_TEXTURE_MIN_FILTER, GL_LINEAR);
|
|
gl->TexParameteri(GL_TEXTURE_3D, GL_TEXTURE_MAG_FILTER, GL_LINEAR);
|
|
gl->TexParameteri(GL_TEXTURE_3D, GL_TEXTURE_WRAP_S, GL_CLAMP);
|
|
gl->TexParameteri(GL_TEXTURE_3D, GL_TEXTURE_WRAP_T, GL_CLAMP);
|
|
gl->TexParameteri(GL_TEXTURE_3D, GL_TEXTURE_WRAP_R, GL_CLAMP);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
texs[0] += '0';
|
|
}
|
|
break;
|
|
default:
|
|
MP_ERR(vo, "unknown conversion type %i\n", conv);
|
|
}
|
|
free(lookup_data);
|
|
}
|
|
|
|
/**
|
|
* \brief adds a scaling texture read at the current fragment program position
|
|
* \param scaler type of scaler to insert
|
|
* \param prog pointer to fragment program so far
|
|
* \param texs array containing the texture unit identifiers for this scaler
|
|
* \param in_tex texture unit the scaler should read from
|
|
* \param out_comp component of the yuv variable the scaler stores the result in
|
|
* \param rect if rectangular (pixel) adressing should be used for in_tex
|
|
* \param texw width of the in_tex texture
|
|
* \param texh height of the in_tex texture
|
|
* \param strength strength of filter effect if the scaler does some kind of filtering
|
|
*/
|
|
static void add_scaler(int scaler, char **prog, char *texs,
|
|
char in_tex, char out_comp, int rect, int texw, int texh,
|
|
double strength)
|
|
{
|
|
const char *ttype = rect ? "RECT" : "2D";
|
|
const float ptw = rect ? 1.0 : 1.0 / texw;
|
|
const float pth = rect ? 1.0 : 1.0 / texh;
|
|
switch (scaler) {
|
|
case YUV_SCALER_BILIN:
|
|
append_template(prog, bilin_filt_template);
|
|
break;
|
|
case YUV_SCALER_BICUB:
|
|
if (rect)
|
|
append_template(prog, bicub_filt_template_RECT);
|
|
else
|
|
append_template(prog, bicub_filt_template_2D);
|
|
break;
|
|
case YUV_SCALER_BICUB_X:
|
|
if (rect)
|
|
append_template(prog, bicub_x_filt_template_RECT);
|
|
else
|
|
append_template(prog, bicub_x_filt_template_2D);
|
|
break;
|
|
case YUV_SCALER_BICUB_NOTEX:
|
|
if (rect)
|
|
append_template(prog, bicub_notex_filt_template_RECT);
|
|
else
|
|
append_template(prog, bicub_notex_filt_template_2D);
|
|
break;
|
|
case YUV_SCALER_UNSHARP:
|
|
append_template(prog, unsharp_filt_template);
|
|
break;
|
|
case YUV_SCALER_UNSHARP2:
|
|
append_template(prog, unsharp_filt_template2);
|
|
break;
|
|
}
|
|
|
|
replace_var_char(prog, "texs", texs[0]);
|
|
replace_var_char(prog, "in_tex", in_tex);
|
|
replace_var_char(prog, "out_comp", out_comp);
|
|
replace_var_str(prog, "tex_type", ttype);
|
|
replace_var_float(prog, "texw", texw);
|
|
replace_var_float(prog, "texh", texh);
|
|
replace_var_float(prog, "ptw", ptw);
|
|
replace_var_float(prog, "pth", pth);
|
|
|
|
// this is silly, not sure if that couldn't be in the shader source instead
|
|
replace_var_float(prog, "ptw_05", ptw * 0.5);
|
|
replace_var_float(prog, "pth_05", pth * 0.5);
|
|
replace_var_float(prog, "ptw_15", ptw * 1.5);
|
|
replace_var_float(prog, "pth_15", pth * 1.5);
|
|
replace_var_float(prog, "ptw_12", ptw * 1.2);
|
|
replace_var_float(prog, "pth_12", pth * 1.2);
|
|
|
|
replace_var_float(prog, "strength", strength);
|
|
}
|
|
|
|
static const struct {
|
|
const char *name;
|
|
GLenum cur;
|
|
GLenum max;
|
|
} progstats[] = {
|
|
{"instructions", 0x88A0, 0x88A1},
|
|
{"native instructions", 0x88A2, 0x88A3},
|
|
{"temporaries", 0x88A4, 0x88A5},
|
|
{"native temporaries", 0x88A6, 0x88A7},
|
|
{"parameters", 0x88A8, 0x88A9},
|
|
{"native parameters", 0x88AA, 0x88AB},
|
|
{"attribs", 0x88AC, 0x88AD},
|
|
{"native attribs", 0x88AE, 0x88AF},
|
|
{"ALU instructions", 0x8805, 0x880B},
|
|
{"TEX instructions", 0x8806, 0x880C},
|
|
{"TEX indirections", 0x8807, 0x880D},
|
|
{"native ALU instructions", 0x8808, 0x880E},
|
|
{"native TEX instructions", 0x8809, 0x880F},
|
|
{"native TEX indirections", 0x880A, 0x8810},
|
|
{NULL, 0, 0}
|
|
};
|
|
|
|
/**
|
|
* \brief load the specified GPU Program
|
|
* \param target program target to load into, only GL_FRAGMENT_PROGRAM is tested
|
|
* \param prog program string
|
|
* \return 1 on success, 0 otherwise
|
|
*/
|
|
static int loadGPUProgram(struct vo *vo, GL *gl, GLenum target, char *prog)
|
|
{
|
|
int i;
|
|
GLint cur = 0, max = 0, err = 0;
|
|
if (!gl->ProgramString) {
|
|
MP_ERR(vo, "Missing GPU program function\n");
|
|
return 0;
|
|
}
|
|
gl->ProgramString(target, GL_PROGRAM_FORMAT_ASCII, strlen(prog), prog);
|
|
gl->GetIntegerv(GL_PROGRAM_ERROR_POSITION, &err);
|
|
if (err != -1) {
|
|
MP_ERR(vo,
|
|
"Error compiling fragment program, make sure your card supports\n"
|
|
" GL_ARB_fragment_program (use glxinfo to check).\n"
|
|
" Error message:\n %s at %.10s\n",
|
|
gl->GetString(GL_PROGRAM_ERROR_STRING), &prog[err]);
|
|
return 0;
|
|
}
|
|
if (!gl->GetProgramivARB)
|
|
return 1;
|
|
MP_VERBOSE(vo, "Program statistics:\n");
|
|
for (i = 0; progstats[i].name; i++) {
|
|
gl->GetProgramivARB(target, progstats[i].cur, &cur);
|
|
gl->GetProgramivARB(target, progstats[i].max, &max);
|
|
MP_VERBOSE(vo, " %s: %i/%i\n", progstats[i].name, cur, max);
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
#define MAX_PROGSZ (1024 * 1024)
|
|
|
|
/**
|
|
* \brief setup a fragment program that will do YUV->RGB conversion
|
|
* \param parms struct containing parameters like conversion and scaler type,
|
|
* brightness, ...
|
|
*/
|
|
static void glSetupYUVFragprog(struct vo *vo, GL *gl,
|
|
gl_conversion_params_t *params)
|
|
{
|
|
int type = params->type;
|
|
int texw = params->texw;
|
|
int texh = params->texh;
|
|
int rect = params->target == GL_TEXTURE_RECTANGLE;
|
|
static const char prog_hdr[] =
|
|
"!!ARBfp1.0\n"
|
|
"OPTION ARB_precision_hint_fastest;\n"
|
|
// all scaler variables must go here so they aren't defined
|
|
// multiple times when the same scaler is used more than once
|
|
"TEMP coord, coord2, cdelta, parmx, parmy, a, b, yuv, textemp;\n";
|
|
char *yuv_prog = NULL;
|
|
char **prog = &yuv_prog;
|
|
int cur_texu = 3;
|
|
char lum_scale_texs[1] = {0};
|
|
char chrom_scale_texs[1] = {0};
|
|
char conv_texs[1];
|
|
char filt_texs[1] = {0};
|
|
GLint i;
|
|
// this is the conversion matrix, with y, u, v factors
|
|
// for red, green, blue and the constant offsets
|
|
float yuv2rgb[3][4];
|
|
int noise = params->noise_strength != 0;
|
|
create_conv_textures(vo, gl, params, &cur_texu, conv_texs);
|
|
create_scaler_textures(vo, gl, YUV_LUM_SCALER(type), &cur_texu, lum_scale_texs);
|
|
if (YUV_CHROM_SCALER(type) == YUV_LUM_SCALER(type))
|
|
memcpy(chrom_scale_texs, lum_scale_texs, sizeof(chrom_scale_texs));
|
|
else
|
|
create_scaler_textures(vo, gl, YUV_CHROM_SCALER(type), &cur_texu,
|
|
chrom_scale_texs);
|
|
|
|
if (noise) {
|
|
gen_noise_lookup_tex(gl, cur_texu);
|
|
filt_texs[0] = '0' + cur_texu++;
|
|
}
|
|
|
|
gl->GetIntegerv(GL_MAX_TEXTURE_IMAGE_UNITS, &i);
|
|
if (i < cur_texu)
|
|
MP_ERR(vo, "%i texture units needed for this type of YUV fragment support (found %i)\n",
|
|
cur_texu, i);
|
|
if (!gl->ProgramString) {
|
|
MP_FATAL(vo, "ProgramString function missing!\n");
|
|
return;
|
|
}
|
|
append_template(prog, prog_hdr);
|
|
add_scaler(YUV_LUM_SCALER(type), prog, lum_scale_texs,
|
|
'0', 'r', rect, texw, texh, params->filter_strength);
|
|
add_scaler(YUV_CHROM_SCALER(type), prog,
|
|
chrom_scale_texs, '1', 'g', rect, params->chrom_texw,
|
|
params->chrom_texh, params->filter_strength);
|
|
add_scaler(YUV_CHROM_SCALER(type), prog,
|
|
chrom_scale_texs, '2', 'b', rect, params->chrom_texw,
|
|
params->chrom_texh, params->filter_strength);
|
|
mp_get_yuv2rgb_coeffs(¶ms->csp_params, yuv2rgb);
|
|
switch (YUV_CONVERSION(type)) {
|
|
case YUV_CONVERSION_FRAGMENT:
|
|
append_template(prog, yuv_prog_template);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_POW:
|
|
append_template(prog, yuv_pow_prog_template);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP:
|
|
append_template(prog, yuv_lookup_prog_template);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
append_template(prog, yuv_lookup3d_prog_template);
|
|
break;
|
|
default:
|
|
MP_ERR(vo, "unknown conversion type %i\n", YUV_CONVERSION(type));
|
|
break;
|
|
}
|
|
for (int r = 0; r < 3; r++) {
|
|
for (int c = 0; c < 4; c++) {
|
|
// "cmRC"
|
|
char var[] = { 'c', 'm', '1' + r, '1' + c, '\0' };
|
|
replace_var_float(prog, var, yuv2rgb[r][c]);
|
|
}
|
|
}
|
|
replace_var_float(prog, "gamma_r", (float)1.0 / params->csp_params.rgamma);
|
|
replace_var_float(prog, "gamma_g", (float)1.0 / params->csp_params.ggamma);
|
|
replace_var_float(prog, "gamma_b", (float)1.0 / params->csp_params.bgamma);
|
|
replace_var_char(prog, "conv_tex0", conv_texs[0]);
|
|
|
|
if (noise) {
|
|
// 1.0 strength is suitable for dithering 8 to 6 bit
|
|
double str = params->noise_strength * (1.0 / 64);
|
|
double scale_x = (double)NOISE_RES / texw;
|
|
double scale_y = (double)NOISE_RES / texh;
|
|
if (rect) {
|
|
scale_x /= texw;
|
|
scale_y /= texh;
|
|
}
|
|
append_template(prog, noise_filt_template);
|
|
replace_var_float(prog, "noise_sx", scale_x);
|
|
replace_var_float(prog, "noise_sy", scale_y);
|
|
replace_var_char(prog, "noise_filt_tex", filt_texs[0]);
|
|
replace_var_float(prog, "noise_str", str);
|
|
}
|
|
|
|
append_template(prog, "MOV result.color.rgb, res;\nEND");
|
|
|
|
MP_DBG(vo, "generated fragment program:\n%s\n", yuv_prog);
|
|
loadGPUProgram(vo, gl, GL_FRAGMENT_PROGRAM, yuv_prog);
|
|
talloc_free(yuv_prog);
|
|
}
|
|
|
|
/**
|
|
* \brief detect the best YUV->RGB conversion method available
|
|
*/
|
|
static int glAutodetectYUVConversion(GL *gl)
|
|
{
|
|
const char *extensions = gl->GetString(GL_EXTENSIONS);
|
|
if (!extensions || !gl->MultiTexCoord2f)
|
|
return YUV_CONVERSION_NONE;
|
|
if (strstr(extensions, "GL_ARB_fragment_program"))
|
|
return YUV_CONVERSION_FRAGMENT;
|
|
if (strstr(extensions, "GL_ATI_text_fragment_shader"))
|
|
return YUV_CONVERSION_TEXT_FRAGMENT;
|
|
if (strstr(extensions, "GL_ATI_fragment_shader"))
|
|
return YUV_CONVERSION_COMBINERS_ATI;
|
|
return YUV_CONVERSION_NONE;
|
|
}
|
|
|
|
/**
|
|
* \brief setup YUV->RGB conversion
|
|
* \param parms struct containing parameters like conversion and scaler type,
|
|
* brightness, ...
|
|
* \ingroup glconversion
|
|
*/
|
|
static void glSetupYUVConversion(struct vo *vo, GL *gl,
|
|
gl_conversion_params_t *params)
|
|
{
|
|
if (params->chrom_texw == 0)
|
|
params->chrom_texw = 1;
|
|
if (params->chrom_texh == 0)
|
|
params->chrom_texh = 1;
|
|
switch (YUV_CONVERSION(params->type)) {
|
|
case YUV_CONVERSION_COMBINERS_ATI:
|
|
glSetupYUVFragmentATI(vo, gl, ¶ms->csp_params, 0);
|
|
break;
|
|
case YUV_CONVERSION_TEXT_FRAGMENT:
|
|
glSetupYUVFragmentATI(vo, gl, ¶ms->csp_params, 1);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP:
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
case YUV_CONVERSION_FRAGMENT:
|
|
case YUV_CONVERSION_FRAGMENT_POW:
|
|
glSetupYUVFragprog(vo, gl, params);
|
|
break;
|
|
case YUV_CONVERSION_NONE:
|
|
break;
|
|
default:
|
|
MP_ERR(vo, "unknown conversion type %i\n", YUV_CONVERSION(params->type));
|
|
}
|
|
}
|
|
|
|
/**
|
|
* \brief enable the specified YUV conversion
|
|
* \param target texture target for Y, U and V textures (e.g. GL_TEXTURE_2D)
|
|
* \param type type of YUV conversion
|
|
* \ingroup glconversion
|
|
*/
|
|
static void glEnableYUVConversion(GL *gl, GLenum target, int type)
|
|
{
|
|
switch (YUV_CONVERSION(type)) {
|
|
case YUV_CONVERSION_COMBINERS_ATI:
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
gl->Enable(target);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
gl->Enable(target);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
gl->Enable(GL_FRAGMENT_SHADER_ATI);
|
|
break;
|
|
case YUV_CONVERSION_TEXT_FRAGMENT:
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
gl->Enable(target);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
gl->Enable(target);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
gl->Enable(GL_TEXT_FRAGMENT_SHADER_ATI);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP:
|
|
case YUV_CONVERSION_FRAGMENT_POW:
|
|
case YUV_CONVERSION_FRAGMENT:
|
|
case YUV_CONVERSION_NONE:
|
|
gl->Enable(GL_FRAGMENT_PROGRAM);
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* \brief disable the specified YUV conversion
|
|
* \param target texture target for Y, U and V textures (e.g. GL_TEXTURE_2D)
|
|
* \param type type of YUV conversion
|
|
* \ingroup glconversion
|
|
*/
|
|
static void glDisableYUVConversion(GL *gl, GLenum target, int type)
|
|
{
|
|
switch (YUV_CONVERSION(type)) {
|
|
case YUV_CONVERSION_COMBINERS_ATI:
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
gl->Disable(target);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
gl->Disable(target);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
gl->Disable(GL_FRAGMENT_SHADER_ATI);
|
|
break;
|
|
case YUV_CONVERSION_TEXT_FRAGMENT:
|
|
gl->Disable(GL_TEXT_FRAGMENT_SHADER_ATI);
|
|
// HACK: at least the Mac OS X 10.5 PPC Radeon drivers are broken and
|
|
// without this disable the texture units while the program is still
|
|
// running (10.4 PPC seems to work without this though).
|
|
gl->Flush();
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
gl->Disable(target);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
gl->Disable(target);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
break;
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP3D:
|
|
case YUV_CONVERSION_FRAGMENT_LOOKUP:
|
|
case YUV_CONVERSION_FRAGMENT_POW:
|
|
case YUV_CONVERSION_FRAGMENT:
|
|
case YUV_CONVERSION_NONE:
|
|
gl->Disable(GL_FRAGMENT_PROGRAM);
|
|
break;
|
|
}
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief draw a texture part at given 2D coordinates
|
|
* \param x screen top coordinate
|
|
* \param y screen left coordinate
|
|
* \param w screen width coordinate
|
|
* \param h screen height coordinate
|
|
* \param tx texture top coordinate in pixels
|
|
* \param ty texture left coordinate in pixels
|
|
* \param tw texture part width in pixels
|
|
* \param th texture part height in pixels
|
|
* \param sx width of texture in pixels
|
|
* \param sy height of texture in pixels
|
|
* \param rect_tex whether this texture uses texture_rectangle extension
|
|
* \param is_yv12 if != 0, also draw the textures from units 1 and 2,
|
|
* bits 8 - 15 and 16 - 23 specify the x and y scaling of those textures
|
|
* \param flip flip the texture upside down
|
|
* \ingroup gltexture
|
|
*/
|
|
static void glDrawTex(GL *gl, GLfloat x, GLfloat y, GLfloat w, GLfloat h,
|
|
GLfloat tx, GLfloat ty, GLfloat tw, GLfloat th,
|
|
int sx, int sy, int rect_tex, int is_yv12, int flip)
|
|
{
|
|
int chroma_x_shift = (is_yv12 >> 8) & 31;
|
|
int chroma_y_shift = (is_yv12 >> 16) & 31;
|
|
GLfloat xscale = 1 << chroma_x_shift;
|
|
GLfloat yscale = 1 << chroma_y_shift;
|
|
GLfloat tx2 = tx / xscale, ty2 = ty / yscale, tw2 = tw / xscale, th2 = th / yscale;
|
|
if (!rect_tex) {
|
|
tx /= sx;
|
|
ty /= sy;
|
|
tw /= sx;
|
|
th /= sy;
|
|
tx2 = tx, ty2 = ty, tw2 = tw, th2 = th;
|
|
}
|
|
if (flip) {
|
|
y += h;
|
|
h = -h;
|
|
}
|
|
gl->Begin(GL_QUADS);
|
|
gl->TexCoord2f(tx, ty);
|
|
if (is_yv12) {
|
|
gl->MultiTexCoord2f(GL_TEXTURE1, tx2, ty2);
|
|
gl->MultiTexCoord2f(GL_TEXTURE2, tx2, ty2);
|
|
}
|
|
gl->Vertex2f(x, y);
|
|
gl->TexCoord2f(tx, ty + th);
|
|
if (is_yv12) {
|
|
gl->MultiTexCoord2f(GL_TEXTURE1, tx2, ty2 + th2);
|
|
gl->MultiTexCoord2f(GL_TEXTURE2, tx2, ty2 + th2);
|
|
}
|
|
gl->Vertex2f(x, y + h);
|
|
gl->TexCoord2f(tx + tw, ty + th);
|
|
if (is_yv12) {
|
|
gl->MultiTexCoord2f(GL_TEXTURE1, tx2 + tw2, ty2 + th2);
|
|
gl->MultiTexCoord2f(GL_TEXTURE2, tx2 + tw2, ty2 + th2);
|
|
}
|
|
gl->Vertex2f(x + w, y + h);
|
|
gl->TexCoord2f(tx + tw, ty);
|
|
if (is_yv12) {
|
|
gl->MultiTexCoord2f(GL_TEXTURE1, tx2 + tw2, ty2);
|
|
gl->MultiTexCoord2f(GL_TEXTURE2, tx2 + tw2, ty2);
|
|
}
|
|
gl->Vertex2f(x + w, y);
|
|
gl->End();
|
|
}
|
|
|
|
static void resize(struct vo *vo, int x, int y)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
MP_VERBOSE(vo, "Resize: %dx%d\n", x, y);
|
|
gl->Viewport(0, 0, x, y);
|
|
|
|
vo_get_src_dst_rects(vo, &p->src_rect, &p->dst_rect, &p->osd_res);
|
|
|
|
gl->MatrixMode(GL_MODELVIEW);
|
|
gl->LoadIdentity();
|
|
gl->Ortho(0, vo->dwidth, vo->dheight, 0, -1, 1);
|
|
|
|
gl->Clear(GL_COLOR_BUFFER_BIT);
|
|
vo->want_redraw = true;
|
|
}
|
|
|
|
static void texSize(struct vo *vo, int w, int h, int *texw, int *texh)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
if (p->use_rectangle) {
|
|
*texw = w;
|
|
*texh = h;
|
|
} else {
|
|
*texw = 32;
|
|
while (*texw < w)
|
|
*texw *= 2;
|
|
*texh = 32;
|
|
while (*texh < h)
|
|
*texh *= 2;
|
|
}
|
|
if (p->ati_hack)
|
|
*texw = (*texw + 511) & ~511;
|
|
}
|
|
|
|
//! maximum size of custom fragment program
|
|
#define MAX_CUSTOM_PROG_SIZE (1024 * 1024)
|
|
static void update_yuvconv(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
if (!vo->params)
|
|
return;
|
|
|
|
struct mp_csp_params cparams = { .colorspace = MP_CSP_DETAILS_DEFAULTS };
|
|
cparams.colorspace.format = vo->params->colorspace;
|
|
cparams.colorspace.levels_in = vo->params->colorlevels;
|
|
cparams.colorspace.levels_out = vo->params->outputlevels;
|
|
mp_csp_copy_equalizer_values(&cparams, &p->video_eq);
|
|
gl_conversion_params_t params = {
|
|
p->target, p->yuvconvtype, cparams,
|
|
p->texture_width, p->texture_height, 0, 0, p->filter_strength,
|
|
p->noise_strength
|
|
};
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(p->image_format);
|
|
int depth = desc.plane_bits;
|
|
params.chrom_texw = params.texw >> desc.chroma_xs;
|
|
params.chrom_texh = params.texh >> desc.chroma_ys;
|
|
params.csp_params.input_bits = depth;
|
|
params.csp_params.texture_bits = depth+7 & ~7;
|
|
glSetupYUVConversion(vo, gl, ¶ms);
|
|
if (p->custom_prog) {
|
|
FILE *f = fopen(p->custom_prog, "rb");
|
|
if (!f) {
|
|
MP_WARN(vo, "Could not read customprog %s\n", p->custom_prog);
|
|
} else {
|
|
char *prog = calloc(1, MAX_CUSTOM_PROG_SIZE + 1);
|
|
fread(prog, 1, MAX_CUSTOM_PROG_SIZE, f);
|
|
fclose(f);
|
|
loadGPUProgram(vo, gl, GL_FRAGMENT_PROGRAM, prog);
|
|
free(prog);
|
|
}
|
|
gl->ProgramEnvParameter4f(GL_FRAGMENT_PROGRAM, 0,
|
|
1.0 / p->texture_width,
|
|
1.0 / p->texture_height,
|
|
p->texture_width, p->texture_height);
|
|
}
|
|
if (p->custom_tex) {
|
|
FILE *f = fopen(p->custom_tex, "rb");
|
|
if (!f) {
|
|
MP_WARN(vo, "Could not read customtex %s\n", p->custom_tex);
|
|
} else {
|
|
int width, height, maxval;
|
|
gl->ActiveTexture(GL_TEXTURE3);
|
|
if (glCreatePPMTex(gl, p->custom_trect ? GL_TEXTURE_RECTANGLE : GL_TEXTURE_2D,
|
|
0, p->custom_tlin ? GL_LINEAR : GL_NEAREST,
|
|
f, &width, &height, &maxval)) {
|
|
gl->ProgramEnvParameter4f(GL_FRAGMENT_PROGRAM, 1,
|
|
1.0 / width, 1.0 / height,
|
|
width, height);
|
|
} else
|
|
MP_WARN(vo, "Error parsing customtex %s\n", p->custom_tex);
|
|
fclose(f);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
}
|
|
}
|
|
}
|
|
|
|
static void draw_osd(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
if (!p->osd)
|
|
return;
|
|
|
|
struct mp_osd_res res = p->osd_res;
|
|
|
|
if (p->scaled_osd) {
|
|
res = osd_res_from_image_params(vo->params);
|
|
gl->MatrixMode(GL_MODELVIEW);
|
|
gl->PushMatrix();
|
|
// Setup image space -> screen space (assumes osd_res in screen space)
|
|
int w = vo->dwidth - (p->osd_res.mr + p->osd_res.ml);
|
|
int h = vo->dheight - (p->osd_res.mt + p->osd_res.mb);
|
|
gl->Translated(p->osd_res.mr, p->osd_res.mt, 0);
|
|
gl->Scaled(1.0 / res.w * w, 1.0 / res.h * h, 1);
|
|
}
|
|
|
|
gl->Color4ub((p->osd_color >> 16) & 0xff, (p->osd_color >> 8) & 0xff,
|
|
p->osd_color & 0xff, 0xff - (p->osd_color >> 24));
|
|
|
|
mpgl_osd_draw_legacy(p->osd, p->osd_pts, res);
|
|
|
|
if (p->scaled_osd)
|
|
gl->PopMatrix();
|
|
}
|
|
|
|
/**
|
|
* \brief uninitialize OpenGL context, freeing textures, buffers etc.
|
|
*/
|
|
static void uninitGl(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
if (!gl)
|
|
return;
|
|
|
|
int i = 0;
|
|
if (gl->DeletePrograms && p->fragprog)
|
|
gl->DeletePrograms(1, &p->fragprog);
|
|
p->fragprog = 0;
|
|
while (p->default_texs[i] != 0)
|
|
i++;
|
|
if (i)
|
|
gl->DeleteTextures(i, p->default_texs);
|
|
p->default_texs[0] = 0;
|
|
if (p->osd)
|
|
mpgl_osd_destroy(p->osd);
|
|
p->osd = NULL;
|
|
p->buffer = 0;
|
|
p->buffersize = 0;
|
|
p->bufferptr = NULL;
|
|
if (gl->DeleteBuffers && p->buffer_uv[0])
|
|
gl->DeleteBuffers(2, p->buffer_uv);
|
|
p->buffer_uv[0] = p->buffer_uv[1] = 0;
|
|
p->buffersize_uv = 0;
|
|
p->bufferptr_uv[0] = p->bufferptr_uv[1] = 0;
|
|
p->err_shown = 0;
|
|
}
|
|
|
|
static void autodetectGlExtensions(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
const char *extensions = gl->GetString(GL_EXTENSIONS);
|
|
const char *vendor = gl->GetString(GL_VENDOR);
|
|
const char *version = gl->GetString(GL_VERSION);
|
|
const char *renderer = gl->GetString(GL_RENDERER);
|
|
int is_ati = vendor && strstr(vendor, "ATI") != NULL;
|
|
int ati_broken_pbo = 0;
|
|
MP_VERBOSE(vo, "Running on OpenGL '%s' by '%s', version '%s'\n",
|
|
renderer, vendor, version);
|
|
if (is_ati && strncmp(version, "2.1.", 4) == 0) {
|
|
int ver = atoi(version + 4);
|
|
MP_VERBOSE(vo, "Detected ATI driver version: %i\n", ver);
|
|
ati_broken_pbo = ver && ver < 8395;
|
|
}
|
|
if (p->ati_hack == -1)
|
|
p->ati_hack = ati_broken_pbo;
|
|
if (p->force_pbo == -1) {
|
|
p->force_pbo = 0;
|
|
if (extensions && strstr(extensions, "_pixel_buffer_object"))
|
|
p->force_pbo = is_ati;
|
|
}
|
|
p->have_texture_rg = extensions && strstr(extensions, "GL_ARB_texture_rg");
|
|
if (p->use_rectangle == -1) {
|
|
p->use_rectangle = 0;
|
|
if (extensions) {
|
|
// if (strstr(extensions, "_texture_non_power_of_two"))
|
|
if (strstr(extensions, "_texture_rectangle"))
|
|
p->use_rectangle = renderer
|
|
&& strstr(renderer, "Mesa DRI R200") ? 1 : 0;
|
|
}
|
|
}
|
|
if (p->use_yuv == -1)
|
|
p->use_yuv = glAutodetectYUVConversion(gl);
|
|
|
|
int eq_caps = 0;
|
|
int yuv_mask = (1 << p->use_yuv);
|
|
if (!(yuv_mask & MASK_NOT_COMBINERS)) {
|
|
// combiners
|
|
eq_caps = (1 << MP_CSP_EQ_HUE) | (1 << MP_CSP_EQ_SATURATION);
|
|
} else if (yuv_mask & MASK_ALL_YUV) {
|
|
eq_caps = MP_CSP_EQ_CAPS_COLORMATRIX;
|
|
if (yuv_mask & MASK_GAMMA_SUPPORT)
|
|
eq_caps |= MP_CSP_EQ_CAPS_GAMMA;
|
|
}
|
|
p->video_eq.capabilities = eq_caps;
|
|
|
|
{
|
|
int target = p->use_rectangle == 1 ? GL_TEXTURE_RECTANGLE : GL_TEXTURE_2D;
|
|
GLint gl_texfmt;
|
|
GLenum gl_format, gl_type;
|
|
glFindFormat(IMGFMT_420P16, p->have_texture_rg, NULL, &gl_texfmt,
|
|
&gl_format, &gl_type);
|
|
glCreateClearTex(gl, target, gl_texfmt, gl_format, gl_type,
|
|
GL_LINEAR, 64, 64, 0);
|
|
int tex_size_token = p->have_texture_rg ? GL_TEXTURE_RED_SIZE
|
|
: GL_TEXTURE_INTENSITY_SIZE;
|
|
GLint size = 8;
|
|
gl->GetTexLevelParameteriv(target, 0, tex_size_token, &size);
|
|
MP_VERBOSE(vo, "16 bit texture depth: %d.\n", size);
|
|
p->max_tex_component_size = size;
|
|
}
|
|
|
|
if (is_ati && (p->lscale == 1 || p->lscale == 2 || p->cscale == 1 || p->cscale == 2))
|
|
MP_WARN(vo, "Selected scaling mode may be broken on"
|
|
" ATI cards.\nTell _them_ to fix GL_REPEAT if you have issues.\n");
|
|
MP_VERBOSE(vo, "Settings after autodetection: ati-hack = %i, "
|
|
"force-pbo = %i, rectangle = %i, yuv = %i\n",
|
|
p->ati_hack, p->force_pbo, p->use_rectangle, p->use_yuv);
|
|
}
|
|
|
|
static GLint get_scale_type(struct vo *vo, int chroma)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
int nearest = (chroma ? p->cscale : p->lscale) & 64;
|
|
if (nearest)
|
|
return p->mipmap_gen ? GL_NEAREST_MIPMAP_NEAREST : GL_NEAREST;
|
|
return p->mipmap_gen ? GL_LINEAR_MIPMAP_NEAREST : GL_LINEAR;
|
|
}
|
|
|
|
// Return the high byte of the value that represents white in chroma (U/V)
|
|
static int get_chroma_clear_val(int bit_depth)
|
|
{
|
|
return 1 << (bit_depth - 1 & 7);
|
|
}
|
|
|
|
/**
|
|
* \brief Initialize a (new or reused) OpenGL context.
|
|
* set global gl-related variables to their default values
|
|
*/
|
|
static int initGl(struct vo *vo, uint32_t d_width, uint32_t d_height)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
GLint scale_type = get_scale_type(vo, 0);
|
|
autodetectGlExtensions(vo);
|
|
p->target = p->use_rectangle == 1 ? GL_TEXTURE_RECTANGLE : GL_TEXTURE_2D;
|
|
p->yuvconvtype = SET_YUV_CONVERSION(p->use_yuv) |
|
|
SET_YUV_LUM_SCALER(p->lscale) |
|
|
SET_YUV_CHROM_SCALER(p->cscale);
|
|
|
|
texSize(vo, p->image_width, p->image_height,
|
|
&p->texture_width, &p->texture_height);
|
|
|
|
gl->Disable(GL_BLEND);
|
|
gl->Disable(GL_DEPTH_TEST);
|
|
gl->DepthMask(GL_FALSE);
|
|
gl->Disable(GL_CULL_FACE);
|
|
gl->Enable(p->target);
|
|
gl->DrawBuffer(GL_BACK);
|
|
gl->TexEnvi(GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, GL_MODULATE);
|
|
|
|
MP_VERBOSE(vo, "Creating %dx%d texture...\n",
|
|
p->texture_width, p->texture_height);
|
|
|
|
glCreateClearTex(gl, p->target, p->texfmt, p->gl_format,
|
|
p->gl_type, scale_type,
|
|
p->texture_width, p->texture_height, 0);
|
|
|
|
if (p->mipmap_gen)
|
|
gl->TexParameteri(p->target, GL_GENERATE_MIPMAP, GL_TRUE);
|
|
|
|
if (p->is_yuv) {
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(p->image_format);
|
|
int i;
|
|
int xs = desc.chroma_xs, ys = desc.chroma_ys, depth = desc.plane_bits;
|
|
scale_type = get_scale_type(vo, 1);
|
|
int clear = get_chroma_clear_val(depth);
|
|
gl->GenTextures(21, p->default_texs);
|
|
p->default_texs[21] = 0;
|
|
for (i = 0; i < 7; i++) {
|
|
gl->ActiveTexture(GL_TEXTURE1 + i);
|
|
gl->BindTexture(GL_TEXTURE_2D, p->default_texs[i]);
|
|
gl->BindTexture(GL_TEXTURE_RECTANGLE, p->default_texs[i + 7]);
|
|
gl->BindTexture(GL_TEXTURE_3D, p->default_texs[i + 14]);
|
|
}
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
glCreateClearTex(gl, p->target, p->texfmt, p->gl_format,
|
|
p->gl_type, scale_type,
|
|
p->texture_width >> xs, p->texture_height >> ys,
|
|
clear);
|
|
if (p->mipmap_gen)
|
|
gl->TexParameteri(p->target, GL_GENERATE_MIPMAP, GL_TRUE);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
glCreateClearTex(gl, p->target, p->texfmt, p->gl_format,
|
|
p->gl_type, scale_type,
|
|
p->texture_width >> xs, p->texture_height >> ys,
|
|
clear);
|
|
if (p->mipmap_gen)
|
|
gl->TexParameteri(p->target, GL_GENERATE_MIPMAP, GL_TRUE);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
gl->BindTexture(p->target, 0);
|
|
}
|
|
if (p->is_yuv || p->custom_prog) {
|
|
if ((MASK_NOT_COMBINERS & (1 << p->use_yuv)) || p->custom_prog) {
|
|
if (!gl->GenPrograms || !gl->BindProgram)
|
|
MP_ERR(vo, "fragment program functions missing!\n");
|
|
else {
|
|
gl->GenPrograms(1, &p->fragprog);
|
|
gl->BindProgram(GL_FRAGMENT_PROGRAM, p->fragprog);
|
|
}
|
|
}
|
|
update_yuvconv(vo);
|
|
}
|
|
|
|
if (gl->BindTexture) {
|
|
p->osd = mpgl_osd_init(gl, vo->log, vo->osd);
|
|
p->osd->scaled = p->scaled_osd;
|
|
}
|
|
|
|
resize(vo, d_width, d_height);
|
|
|
|
gl->ClearColor(0.0f, 0.0f, 0.0f, 0.0f);
|
|
gl->Clear(GL_COLOR_BUFFER_BIT);
|
|
if (gl->SwapInterval && p->swap_interval >= 0)
|
|
gl->SwapInterval(p->swap_interval);
|
|
return 1;
|
|
}
|
|
|
|
static bool config_window(struct vo *vo, int flags)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
if (p->stereo_mode == GL_3D_QUADBUFFER)
|
|
flags |= VOFLAG_STEREO;
|
|
|
|
int mpgl_caps = MPGL_CAP_GL_LEGACY;
|
|
if (!p->allow_sw)
|
|
mpgl_caps |= MPGL_CAP_NO_SW;
|
|
return mpgl_config_window(p->glctx, mpgl_caps, flags);
|
|
}
|
|
|
|
static int reconfig(struct vo *vo, struct mp_image_params *params, int flags)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(params->imgfmt);
|
|
|
|
p->image_height = params->h;
|
|
p->image_width = params->w;
|
|
p->image_format = params->imgfmt;
|
|
p->is_yuv = !!(desc.flags & MP_IMGFLAG_YUV_P);
|
|
p->is_yuv |= (desc.chroma_xs << 8) | (desc.chroma_ys << 16);
|
|
if (p->image_format == IMGFMT_Y8)
|
|
p->is_yuv = 0;
|
|
glFindFormat(p->image_format, p->have_texture_rg, NULL, &p->texfmt,
|
|
&p->gl_format, &p->gl_type);
|
|
|
|
p->vo_flipped = !!(flags & VOFLAG_FLIPPING);
|
|
|
|
uninitGl(vo);
|
|
|
|
if (!config_window(vo, flags))
|
|
return -1;
|
|
|
|
initGl(vo, vo->dwidth, vo->dheight);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void do_render(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
// Enable(GL_TEXTURE_2D);
|
|
// BindTexture(GL_TEXTURE_2D, texture_id);
|
|
|
|
gl->Color4f(1, 1, 1, 1);
|
|
if (p->is_yuv || p->custom_prog)
|
|
glEnableYUVConversion(gl, p->target, p->yuvconvtype);
|
|
int src_w = p->src_rect.x1 - p->src_rect.x0;
|
|
int src_h = p->src_rect.y1 - p->src_rect.y0;
|
|
int dst_w = p->dst_rect.x1 - p->dst_rect.x0;
|
|
int dst_h = p->dst_rect.y1 - p->dst_rect.y0;
|
|
if (p->stereo_mode) {
|
|
glEnable3DLeft(gl, p->stereo_mode);
|
|
glDrawTex(gl,
|
|
p->dst_rect.x0, p->dst_rect.y0, dst_w, dst_h,
|
|
p->src_rect.x0 / 2, p->src_rect.y0, src_w / 2, src_h,
|
|
p->texture_width, p->texture_height,
|
|
p->use_rectangle == 1, p->is_yuv,
|
|
p->mpi_flipped ^ p->vo_flipped);
|
|
glEnable3DRight(gl, p->stereo_mode);
|
|
glDrawTex(gl,
|
|
p->dst_rect.x0, p->dst_rect.y0, dst_w, dst_h,
|
|
p->src_rect.x0 / 2 + p->image_width / 2, p->src_rect.y0,
|
|
src_w / 2, src_h,
|
|
p->texture_width, p->texture_height,
|
|
p->use_rectangle == 1, p->is_yuv,
|
|
p->mpi_flipped ^ p->vo_flipped);
|
|
glDisable3D(gl, p->stereo_mode);
|
|
} else {
|
|
glDrawTex(gl,
|
|
p->dst_rect.x0, p->dst_rect.y0, dst_w, dst_h,
|
|
p->src_rect.x0, p->src_rect.y0, src_w, src_h,
|
|
p->texture_width, p->texture_height,
|
|
p->use_rectangle == 1, p->is_yuv,
|
|
p->mpi_flipped ^ p->vo_flipped);
|
|
}
|
|
if (p->is_yuv || p->custom_prog)
|
|
glDisableYUVConversion(gl, p->target, p->yuvconvtype);
|
|
|
|
draw_osd(vo);
|
|
}
|
|
|
|
static void flip_page(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
if (p->use_glFinish)
|
|
gl->Finish();
|
|
p->glctx->swapGlBuffers(p->glctx);
|
|
|
|
if (p->dst_rect.x0 > 0|| p->dst_rect.y0 > 0 ||
|
|
p->dst_rect.x1 < vo->dwidth || p->dst_rect.y1 < vo->dheight)
|
|
{
|
|
gl->Clear(GL_COLOR_BUFFER_BIT);
|
|
}
|
|
}
|
|
|
|
static bool get_image(struct vo *vo, mp_image_t *mpi, int *th, bool *cplane)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
bool common_plane = false;
|
|
|
|
int needed_size;
|
|
if (!gl->GenBuffers || !gl->BindBuffer || !gl->BufferData || !gl->MapBuffer) {
|
|
if (!p->err_shown)
|
|
MP_ERR(vo, "extensions missing for dr\nExpect a _major_ speed penalty\n");
|
|
p->err_shown = 1;
|
|
return false;
|
|
}
|
|
int width = mpi->w, height = mpi->h;
|
|
if (p->ati_hack) {
|
|
width = p->texture_width;
|
|
height = p->texture_height;
|
|
}
|
|
int avgbpp16 = 0;
|
|
for (int pl = 0; pl < 4; pl++)
|
|
avgbpp16 += (16 * mpi->fmt.bpp[pl]) >> mpi->fmt.xs[pl] >> mpi->fmt.ys[pl];
|
|
int avgbpp = avgbpp16 / 16;
|
|
mpi->stride[0] = width * avgbpp / 8;
|
|
needed_size = mpi->stride[0] * height;
|
|
if (!p->buffer)
|
|
gl->GenBuffers(1, &p->buffer);
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer);
|
|
if (needed_size > p->buffersize) {
|
|
p->buffersize = needed_size;
|
|
gl->BufferData(GL_PIXEL_UNPACK_BUFFER, p->buffersize,
|
|
NULL, GL_DYNAMIC_DRAW);
|
|
}
|
|
if (!p->bufferptr)
|
|
p->bufferptr = gl->MapBuffer(GL_PIXEL_UNPACK_BUFFER, GL_WRITE_ONLY);
|
|
mpi->planes[0] = p->bufferptr;
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, 0);
|
|
if (!mpi->planes[0]) {
|
|
if (!p->err_shown)
|
|
MP_ERR(vo, "could not acquire buffer for dr\n"
|
|
"Expect a _major_ speed penalty\n");
|
|
p->err_shown = 1;
|
|
return false;
|
|
}
|
|
if (p->is_yuv) {
|
|
// planar YUV
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(p->image_format);
|
|
int xs = desc.chroma_xs, ys = desc.chroma_ys, depth = desc.plane_bits;
|
|
int bp = (depth + 7) / 8;
|
|
common_plane = true;
|
|
mpi->stride[0] = width * bp;
|
|
mpi->planes[1] = mpi->planes[0] + mpi->stride[0] * height;
|
|
mpi->stride[1] = (width >> xs) * bp;
|
|
mpi->planes[2] = mpi->planes[1] + mpi->stride[1] * (height >> ys);
|
|
mpi->stride[2] = (width >> xs) * bp;
|
|
if (p->ati_hack) {
|
|
common_plane = false;
|
|
if (!p->buffer_uv[0])
|
|
gl->GenBuffers(2, p->buffer_uv);
|
|
int buffer_size = mpi->stride[1] * height;
|
|
if (buffer_size > p->buffersize_uv) {
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[0]);
|
|
gl->BufferData(GL_PIXEL_UNPACK_BUFFER, buffer_size, NULL,
|
|
GL_DYNAMIC_DRAW);
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[1]);
|
|
gl->BufferData(GL_PIXEL_UNPACK_BUFFER, buffer_size, NULL,
|
|
GL_DYNAMIC_DRAW);
|
|
p->buffersize_uv = buffer_size;
|
|
}
|
|
if (!p->bufferptr_uv[0]) {
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[0]);
|
|
p->bufferptr_uv[0] = gl->MapBuffer(GL_PIXEL_UNPACK_BUFFER,
|
|
GL_WRITE_ONLY);
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[1]);
|
|
p->bufferptr_uv[1] = gl->MapBuffer(GL_PIXEL_UNPACK_BUFFER,
|
|
GL_WRITE_ONLY);
|
|
}
|
|
mpi->planes[1] = p->bufferptr_uv[0];
|
|
mpi->planes[2] = p->bufferptr_uv[1];
|
|
}
|
|
}
|
|
*th = height;
|
|
*cplane = common_plane;
|
|
return true;
|
|
}
|
|
|
|
static void clear_border(struct vo *vo, uint8_t *dst, int start, int stride,
|
|
int height, int full_height, int value)
|
|
{
|
|
int right_border = stride - start;
|
|
int bottom_border = full_height - height;
|
|
while (height > 0) {
|
|
if (right_border > 0)
|
|
memset(dst + start, value, right_border);
|
|
dst += stride;
|
|
height--;
|
|
}
|
|
if (bottom_border > 0)
|
|
memset(dst, value, stride * bottom_border);
|
|
}
|
|
|
|
static void draw_image(struct vo *vo, mp_image_t *mpi)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
p->osd_pts = mpi->pts;
|
|
|
|
int slice = p->slice_height;
|
|
int stride[3];
|
|
unsigned char *planes[3];
|
|
mp_image_t mpi2 = *mpi;
|
|
int w = mpi->w, h = mpi->h;
|
|
int th = h;
|
|
bool common_plane = false;
|
|
bool pbo = false;
|
|
mpi2.flags = 0;
|
|
if (p->force_pbo && !p->bufferptr
|
|
&& get_image(vo, &mpi2, &th, &common_plane))
|
|
{
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(p->image_format);
|
|
int bp = desc.bytes[0];
|
|
int xs = desc.chroma_xs, ys = desc.chroma_ys, depth = desc.plane_bits;
|
|
memcpy_pic(mpi2.planes[0], mpi->planes[0], mpi->w * bp, mpi->h,
|
|
mpi2.stride[0], mpi->stride[0]);
|
|
int uv_bytes = (mpi->w >> xs) * bp;
|
|
if (p->is_yuv) {
|
|
memcpy_pic(mpi2.planes[1], mpi->planes[1], uv_bytes, mpi->h >> ys,
|
|
mpi2.stride[1], mpi->stride[1]);
|
|
memcpy_pic(mpi2.planes[2], mpi->planes[2], uv_bytes, mpi->h >> ys,
|
|
mpi2.stride[2], mpi->stride[2]);
|
|
}
|
|
if (p->ati_hack) {
|
|
// since we have to do a full upload we need to clear the borders
|
|
clear_border(vo, mpi2.planes[0], mpi->w * bp, mpi2.stride[0],
|
|
mpi->h, th, 0);
|
|
if (p->is_yuv) {
|
|
int clear = get_chroma_clear_val(depth);
|
|
clear_border(vo, mpi2.planes[1], uv_bytes, mpi2.stride[1],
|
|
mpi->h >> ys, th >> ys, clear);
|
|
clear_border(vo, mpi2.planes[2], uv_bytes, mpi2.stride[2],
|
|
mpi->h >> ys, th >> ys, clear);
|
|
}
|
|
}
|
|
mpi = &mpi2;
|
|
pbo = true;
|
|
}
|
|
stride[0] = mpi->stride[0];
|
|
stride[1] = mpi->stride[1];
|
|
stride[2] = mpi->stride[2];
|
|
planes[0] = mpi->planes[0];
|
|
planes[1] = mpi->planes[1];
|
|
planes[2] = mpi->planes[2];
|
|
p->mpi_flipped = stride[0] < 0;
|
|
if (pbo) {
|
|
intptr_t base = (intptr_t)planes[0];
|
|
if (p->ati_hack) {
|
|
w = p->texture_width;
|
|
h = p->texture_height;
|
|
}
|
|
if (p->mpi_flipped)
|
|
base += (mpi->h - 1) * stride[0];
|
|
planes[0] -= base;
|
|
planes[1] -= base;
|
|
planes[2] -= base;
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer);
|
|
gl->UnmapBuffer(GL_PIXEL_UNPACK_BUFFER);
|
|
p->bufferptr = NULL;
|
|
if (!common_plane)
|
|
planes[0] = planes[1] = planes[2] = NULL;
|
|
slice = 0; // always "upload" full texture
|
|
}
|
|
glUploadTex(gl, p->target, p->gl_format, p->gl_type, planes[0],
|
|
stride[0], 0, 0, w, h, slice);
|
|
if (p->is_yuv) {
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(p->image_format);
|
|
int xs = desc.chroma_xs, ys = desc.chroma_ys;
|
|
if (pbo && !common_plane) {
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[0]);
|
|
gl->UnmapBuffer(GL_PIXEL_UNPACK_BUFFER);
|
|
p->bufferptr_uv[0] = NULL;
|
|
}
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
glUploadTex(gl, p->target, p->gl_format, p->gl_type, planes[1],
|
|
stride[1], 0, 0, w >> xs, h >> ys, slice);
|
|
if (pbo && !common_plane) {
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, p->buffer_uv[1]);
|
|
gl->UnmapBuffer(GL_PIXEL_UNPACK_BUFFER);
|
|
p->bufferptr_uv[1] = NULL;
|
|
}
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
glUploadTex(gl, p->target, p->gl_format, p->gl_type, planes[2],
|
|
stride[2], 0, 0, w >> xs, h >> ys, slice);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
}
|
|
if (pbo) {
|
|
gl->BindBuffer(GL_PIXEL_UNPACK_BUFFER, 0);
|
|
}
|
|
|
|
do_render(vo);
|
|
|
|
talloc_free(mpi);
|
|
}
|
|
|
|
static mp_image_t *get_screenshot(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
GL *gl = p->gl;
|
|
|
|
if (!vo->params)
|
|
return NULL;
|
|
|
|
mp_image_t *image = mp_image_alloc(p->image_format, p->texture_width,
|
|
p->texture_height);
|
|
if (!image)
|
|
return NULL;
|
|
|
|
glDownloadTex(gl, p->target, p->gl_format, p->gl_type, image->planes[0],
|
|
image->stride[0]);
|
|
|
|
if (p->is_yuv) {
|
|
gl->ActiveTexture(GL_TEXTURE1);
|
|
glDownloadTex(gl, p->target, p->gl_format, p->gl_type, image->planes[1],
|
|
image->stride[1]);
|
|
gl->ActiveTexture(GL_TEXTURE2);
|
|
glDownloadTex(gl, p->target, p->gl_format, p->gl_type, image->planes[2],
|
|
image->stride[2]);
|
|
gl->ActiveTexture(GL_TEXTURE0);
|
|
}
|
|
mp_image_set_size(image, p->image_width, p->image_height);
|
|
mp_image_set_attributes(image, vo->params);
|
|
|
|
return image;
|
|
}
|
|
|
|
static int query_format(struct vo *vo, uint32_t format)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
struct mp_imgfmt_desc desc = mp_imgfmt_get_desc(format);
|
|
|
|
int depth = desc.plane_bits;
|
|
int caps = VFCAP_CSP_SUPPORTED | VFCAP_CSP_SUPPORTED_BY_HW;
|
|
if (format == IMGFMT_RGB24 || format == IMGFMT_RGBA)
|
|
return caps;
|
|
if (p->use_yuv && (desc.flags & MP_IMGFLAG_YUV_P) &&
|
|
(depth == 8 || depth == 16 ||
|
|
p->max_tex_component_size >= 16 && glYUVLargeRange(p->use_yuv)) &&
|
|
(depth <= 16 && (desc.flags & MP_IMGFLAG_NE)))
|
|
return caps;
|
|
// HACK, otherwise we get only b&w with some filters (e.g. -vf eq)
|
|
// ideally MPlayer should be fixed instead not to use Y800 when it has the choice
|
|
if (!p->use_yuv && (format == IMGFMT_Y8))
|
|
return 0;
|
|
if (!p->use_ycbcr && (format == IMGFMT_UYVY))
|
|
return 0;
|
|
if (p->many_fmts &&
|
|
glFindFormat(format, p->have_texture_rg, NULL, NULL, NULL, NULL))
|
|
return caps;
|
|
return 0;
|
|
}
|
|
|
|
static void uninit(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
uninitGl(vo);
|
|
mpgl_uninit(p->glctx);
|
|
p->glctx = NULL;
|
|
p->gl = NULL;
|
|
}
|
|
|
|
static int preinit(struct vo *vo)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
if (p->use_yuv == 1) {
|
|
MP_WARN(vo, "yuv=1 (nVidia register combiners) have"
|
|
" been removed, using yuv=2 instead.\n");
|
|
p->use_yuv = 2;
|
|
}
|
|
|
|
p->glctx = mpgl_init(vo, p->backend_arg);
|
|
if (!p->glctx)
|
|
goto err_out;
|
|
p->gl = p->glctx->gl;
|
|
|
|
if (p->use_yuv == -1) {
|
|
if (!config_window(vo, VOFLAG_HIDDEN))
|
|
goto err_out;
|
|
autodetectGlExtensions(vo);
|
|
}
|
|
MP_VERBOSE(vo, "Using %d as slice height "
|
|
"(0 means image height).\n", p->slice_height);
|
|
|
|
return 0;
|
|
|
|
err_out:
|
|
uninit(vo);
|
|
return -1;
|
|
}
|
|
|
|
static int control(struct vo *vo, uint32_t request, void *data)
|
|
{
|
|
struct gl_priv *p = vo->priv;
|
|
|
|
switch (request) {
|
|
case VOCTRL_GET_PANSCAN:
|
|
return VO_TRUE;
|
|
case VOCTRL_SET_PANSCAN:
|
|
resize(vo, vo->dwidth, vo->dheight);
|
|
return VO_TRUE;
|
|
case VOCTRL_GET_EQUALIZER:
|
|
if (p->is_yuv) {
|
|
struct voctrl_get_equalizer_args *args = data;
|
|
return mp_csp_equalizer_get(&p->video_eq, args->name, args->valueptr)
|
|
>= 0 ? VO_TRUE : VO_NOTIMPL;
|
|
}
|
|
break;
|
|
case VOCTRL_SET_EQUALIZER:
|
|
if (p->is_yuv) {
|
|
struct voctrl_set_equalizer_args *args = data;
|
|
if (mp_csp_equalizer_set(&p->video_eq, args->name, args->value) < 0)
|
|
return VO_NOTIMPL;
|
|
update_yuvconv(vo);
|
|
vo->want_redraw = true;
|
|
return VO_TRUE;
|
|
}
|
|
break;
|
|
case VOCTRL_GET_COLORSPACE: {
|
|
struct mp_image_params *params = data;
|
|
bool supports_csp = (1 << p->use_yuv) & MASK_NOT_COMBINERS;
|
|
if (vo->params && supports_csp) {
|
|
params->colorspace = vo->params->colorspace;
|
|
params->colorlevels = vo->params->colorlevels;
|
|
params->outputlevels = vo->params->outputlevels;
|
|
}
|
|
return VO_TRUE;
|
|
}
|
|
case VOCTRL_REDRAW_FRAME:
|
|
do_render(vo);
|
|
return true;
|
|
case VOCTRL_SCREENSHOT: {
|
|
struct voctrl_screenshot_args *args = data;
|
|
if (args->full_window)
|
|
args->out_image = glGetWindowScreenshot(p->gl);
|
|
else
|
|
args->out_image = get_screenshot(vo);
|
|
return true;
|
|
}
|
|
}
|
|
|
|
int events = 0;
|
|
int r = p->glctx->vo_control(vo, &events, request, data);
|
|
if (events & VO_EVENT_RESIZE)
|
|
resize(vo, vo->dwidth, vo->dheight);
|
|
if (events & VO_EVENT_EXPOSE)
|
|
vo->want_redraw = true;
|
|
|
|
return r;
|
|
}
|
|
|
|
#define OPT_BASE_STRUCT struct gl_priv
|
|
|
|
const struct vo_driver video_out_opengl_old = {
|
|
.description = "OpenGL (legacy VO, may work better on older GPUs)",
|
|
.name = "opengl-old",
|
|
.preinit = preinit,
|
|
.query_format = query_format,
|
|
.reconfig = reconfig,
|
|
.control = control,
|
|
.draw_image = draw_image,
|
|
.flip_page = flip_page,
|
|
.uninit = uninit,
|
|
.priv_size = sizeof(struct gl_priv),
|
|
.priv_defaults = &(const struct gl_priv) {
|
|
.many_fmts = 1,
|
|
.use_yuv = -1,
|
|
.filter_strength = 0.5,
|
|
.use_rectangle = -1,
|
|
.ati_hack = -1,
|
|
.force_pbo = -1,
|
|
.swap_interval = 1,
|
|
.custom_prog = NULL,
|
|
.custom_tex = NULL,
|
|
.custom_tlin = 1,
|
|
.osd_color = 0xffffff,
|
|
},
|
|
.options = (const struct m_option[]) {
|
|
OPT_FLAG("manyfmts", many_fmts, 0),
|
|
OPT_FLAG("scaled-osd", scaled_osd, 0),
|
|
OPT_FLAG("ycbcr", use_ycbcr, 0),
|
|
OPT_INT("slice-height", slice_height, M_OPT_MIN, .min = 0),
|
|
OPT_INT("rectangle", use_rectangle, M_OPT_MIN, .min = -1),
|
|
OPT_INT("yuv", use_yuv, M_OPT_MIN, .min = -1),
|
|
OPT_INT("lscale", lscale, M_OPT_MIN, .min = 0),
|
|
OPT_INT("cscale", cscale, M_OPT_MIN, .min = 0),
|
|
OPT_FLOAT("filter-strength", filter_strength, 0),
|
|
OPT_FLOAT("noise-strength", noise_strength, 0),
|
|
OPT_CHOICE("ati-hack", ati_hack, 0,
|
|
({"auto", -1}, {"no", 0}, {"yes", 1})),
|
|
OPT_CHOICE("force-pbo", force_pbo, 0,
|
|
({"auto", -1}, {"no", 0}, {"yes", 1})),
|
|
OPT_FLAG("glfinish", use_glFinish, 0),
|
|
OPT_INT("swapinterval", swap_interval, 0),
|
|
OPT_STRING("customprog", custom_prog, 0),
|
|
OPT_STRING("customtex", custom_tex, 0),
|
|
OPT_FLAG("customtlin", custom_tlin, 0),
|
|
OPT_FLAG("customtrect", custom_trect, 0),
|
|
OPT_FLAG("mipmapgen", mipmap_gen, 0),
|
|
OPT_INT("osdcolor", osd_color, 0),
|
|
OPT_INT("stereo", stereo_mode, 0),
|
|
OPT_FLAG("sw", allow_sw, 0),
|
|
OPT_STRING_VALIDATE("backend", backend_arg, 0, mpgl_validate_backend_opt),
|
|
{0}
|
|
},
|
|
};
|