mpv/libvo/vo_tdfx_vid.c

670 lines
18 KiB
C

/*
* copyright (C) 2003 Alban Bedel
*
* This file is part of MPlayer.
*
* MPlayer is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* MPlayer is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with MPlayer; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>
#include <sys/ioctl.h>
#include <sys/mman.h>
#include "config.h"
#include "video_out.h"
#include "video_out_internal.h"
#include "aspect.h"
#include "mp_msg.h"
#include "help_mp.h"
#include "fastmemcpy.h"
#include "drivers/tdfx_vid.h"
static const vo_info_t info =
{
"tdfx vid",
"tdfx_vid",
"Albeu",
""
};
//#define VERBOSE
const LIBVO_EXTERN(tdfx_vid)
static tdfx_vid_config_t tdfx_cfg;
static unsigned char* agp_mem = NULL;
static int tdfx_fd = -1;
static uint32_t img_fmt; // The real input format
static uint32_t src_width, src_height, src_fmt, src_bpp, src_stride;
static uint32_t dst_width, dst_height, dst_fmt, dst_bpp, dst_stride;
static uint32_t tdfx_page;
static uint32_t front_buffer;
static uint32_t back_buffer;
static uint8_t num_buffer = 3;
static uint32_t buffer_size; // Max size
static uint8_t current_buffer = 0;
static uint8_t current_ip_buf = 0;
static uint32_t buffer_stride[3];
static int use_overlay = 1;
static tdfx_vid_overlay_t tdfx_ov;
// FIXME
#if 0
static void clear_screen(void) {
tdfx_vid_agp_move_t mov;
memset(agp_mem,0,tdfx_cfg.screen_width*dst_bpp*tdfx_cfg.screen_height);
mov.move2 = TDFX_VID_MOVE_2_PACKED;
mov.width = tdfx_cfg.screen_width*dst_bpp;
mov.height = tdfx_cfg.screen_height;
mov.src = 0;
mov.src_stride = tdfx_cfg.screen_width*dst_bpp;
mov.dst = front_buffer;
mov.dst_stride = tdfx_cfg.screen_stride;
mp_msg(MSGT_VO,MSGL_INFO, MSGTR_LIBVO_TDFXVID_Move, mov.width,mov.src_stride,mov.height,mov.dst_stride);
if(ioctl(tdfx_fd,TDFX_VID_AGP_MOVE,&mov))
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_AGPMoveFailedToClearTheScreen);
}
#endif
static int draw_slice(uint8_t *image[], int stride[], int w,int h,int x,int y)
{
uint8_t* ptr[3];
#ifdef VERBOSE
printf("Draw slices %d\n",current_buffer);
#endif
switch(img_fmt) {
case IMGFMT_YUY2:
case IMGFMT_UYVY:
case IMGFMT_BGR8:
case IMGFMT_BGR16:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
// copy :( to agp_mem
// still faster than tdfxfb wich directly copy to the video mem :)
mem2agpcpy_pic(agp_mem + current_buffer * buffer_size +
y*buffer_stride[0] + x * src_bpp,
image[0],
src_bpp*w,h,buffer_stride[0],stride[0]);
return 0;
case IMGFMT_YV12:
case IMGFMT_I420:
// Copy to agp mem
ptr[0] = agp_mem + current_buffer * buffer_size;
mem2agpcpy_pic(ptr[0] + y * buffer_stride[0] + x,image[0],w,h,
buffer_stride[0],stride[0]);
ptr[1] = ptr[0] + (src_height*src_width);
mem2agpcpy_pic(ptr[1] + y/2 * buffer_stride[1] + x/2,image[1],w/2,h/2,
buffer_stride[1],stride[1]);
ptr[2] = ptr[1] + (src_height*src_width/4);
mem2agpcpy_pic(ptr[2] + y/2 * buffer_stride[2] + x/2,image[2],w/2,h/2,
buffer_stride[2],stride[2]);
return 0;
}
return 1;
}
static void draw_osd(void)
{
}
static void
flip_page(void)
{
tdfx_vid_blit_t blit;
//return;
// Scale convert
#ifdef VERBOSE
printf("Flip\n");
#endif
if(use_overlay) {
// TDFX_VID_OVERLAY_ON does nothing if the overlay is already on
if(!ioctl(tdfx_fd,TDFX_VID_OVERLAY_ON)) { // X11 killed the overlay :(
if(ioctl(tdfx_fd,TDFX_VID_SET_OVERLAY,&tdfx_ov))
mp_msg(MSGT_VO, MSGL_ERR, "tdfx_vid: set_overlay failed\n");
}
// These formats need conversion
switch(src_fmt) {
case IMGFMT_BGR8:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
memset(&blit,0,sizeof(tdfx_vid_blit_t));
blit.src = back_buffer;
blit.src_stride = src_stride;
blit.src_x = 0;
blit.src_y = 0;
blit.src_w = src_width;
blit.src_h = src_height;
blit.src_format = src_fmt;
blit.dst = front_buffer;
blit.dst_stride = dst_stride;
blit.dst_x = 0;
blit.dst_y = 0;
blit.dst_w = src_width;
blit.dst_h = src_height;
blit.dst_format = IMGFMT_BGR16;
if(ioctl(tdfx_fd,TDFX_VID_BLIT,&blit))
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_BlitFailed);
}
return;
}
memset(&blit,0,sizeof(tdfx_vid_blit_t));
blit.src = back_buffer;
blit.src_stride = src_stride;
blit.src_x = 0;
blit.src_y = 0;
blit.src_w = src_width;
blit.src_h = src_height;
blit.src_format = src_fmt;
blit.dst = front_buffer;
blit.dst_stride = dst_stride;
blit.dst_x = 0;
blit.dst_y = 0;
blit.dst_w = dst_width;
blit.dst_h = dst_height;
blit.dst_format = dst_fmt;
if(ioctl(tdfx_fd,TDFX_VID_BLIT,&blit))
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_BlitFailed);
}
static int
draw_frame(uint8_t *src[])
{
int stride[] = { src_stride, 0, 0};
return draw_slice(src,stride,src_width, src_height,0,0);
}
static int
query_format(uint32_t format)
{
switch(format) {
case IMGFMT_BGR8:
if(tdfx_cfg.screen_format == TDFX_VID_FORMAT_BGR8)
return VFCAP_CSP_SUPPORTED | VFCAP_CSP_SUPPORTED_BY_HW | VFCAP_HWSCALE_UP | VFCAP_HWSCALE_DOWN | VFCAP_ACCEPT_STRIDE;
return 0;
case IMGFMT_YUY2:
case IMGFMT_UYVY:
case IMGFMT_BGR15:
case IMGFMT_BGR16:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
case IMGFMT_YV12:
case IMGFMT_I420:
if(tdfx_cfg.screen_format == TDFX_VID_FORMAT_BGR8)
return 0;
return VFCAP_CSP_SUPPORTED | VFCAP_CSP_SUPPORTED_BY_HW | VFCAP_HWSCALE_UP | VFCAP_HWSCALE_DOWN | VFCAP_ACCEPT_STRIDE;
}
return 0;
}
static int
config(uint32_t width, uint32_t height, uint32_t d_width, uint32_t d_height, uint32_t flags, char *title, uint32_t format)
{
if(tdfx_fd < 0)
return 1;
// When we are run as sub vo we must follow the size gaven to us
if(!(flags & VOFLAG_XOVERLAY_SUB_VO)) {
if(!vo_screenwidth)
vo_screenwidth = tdfx_cfg.screen_width;
if(!vo_screenheight)
vo_screenheight = tdfx_cfg.screen_height;
aspect_save_orig(width,height);
aspect_save_prescale(d_width,d_height);
aspect_save_screenres(vo_screenwidth,vo_screenheight);
if(flags&VOFLAG_FULLSCREEN) { /* -fs */
aspect(&d_width,&d_height,A_ZOOM);
vo_fs = VO_TRUE;
} else {
aspect(&d_width,&d_height,A_NOZOOM);
vo_fs = VO_FALSE;
}
}
src_width = width;
src_height = height;
buffer_size = 0;
buffer_stride[0] = 0;
src_fmt = 0;
switch(format) {
case IMGFMT_BGR8:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
if(use_overlay)
mp_msg(MSGT_VO,MSGL_INFO, MSGTR_LIBVO_TDFXVID_NonNativeOverlayFormatNeedConversion);
case IMGFMT_BGR15:
case IMGFMT_BGR16:
src_bpp = ((format & 0x3F)+7)/8;
break;
case IMGFMT_YV12:
case IMGFMT_I420:
buffer_size = src_width * src_height * 3 / 2;
buffer_stride[0] = ((src_width+1)/2)*2;
buffer_stride[1] = buffer_stride[2] = buffer_stride[0]/2;
src_fmt = TDFX_VID_FORMAT_YUY2;
case IMGFMT_YUY2:
case IMGFMT_UYVY:
src_bpp = 2;
break;
default:
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_UnsupportedInputFormat,format);
return 1;
}
img_fmt = format;
src_stride = src_width*src_bpp;
// The overlay need a 4 bytes aligned stride
if(use_overlay)
src_stride = ((src_stride+3)/4)*4;
if(!src_fmt)
src_fmt = format;
if(!buffer_size)
buffer_size = src_stride*src_height;
if(!buffer_stride[0])
buffer_stride[0] = src_stride;
dst_fmt = tdfx_cfg.screen_format;
dst_bpp = ((dst_fmt & 0x3F)+7)/8;
dst_width = d_width;
dst_height = d_height;
dst_stride = tdfx_cfg.screen_stride;
tdfx_page = tdfx_cfg.screen_stride*tdfx_cfg.screen_height;
front_buffer = tdfx_cfg.screen_start;
back_buffer = front_buffer + tdfx_page;
while(use_overlay) {
tdfx_vid_overlay_t ov;
uint32_t ov_fmt = src_fmt, ov_stride = src_stride;
// Align the buffer
back_buffer = (((back_buffer+3)/4)*4);
// With the overlay the front buffer is not on the screen
// so we take the back buffer
front_buffer = back_buffer;
switch(src_fmt) {
case IMGFMT_BGR8:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
back_buffer = front_buffer + 2*(src_stride*src_height);
ov_stride = dst_stride = src_width<<1;
ov_fmt = IMGFMT_BGR16;
break;
}
ov.src[0] = front_buffer;
ov.src[1] = front_buffer + (src_stride*src_height);
ov.src_width = src_width;
ov.src_height = src_height;
ov.src_stride = ov_stride;
ov.format = ov_fmt;
ov.dst_width = dst_width;
ov.dst_height = dst_height;
ov.dst_x = vo_dx;
ov.dst_y = vo_dy;
ov.use_colorkey = 0;
if(ioctl(tdfx_fd,TDFX_VID_SET_OVERLAY,&ov)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_OverlaySetupFailed);
use_overlay = 0;
break;
}
tdfx_ov = ov;
if(use_overlay == 1) {
if(ioctl(tdfx_fd,TDFX_VID_OVERLAY_ON)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_OverlayOnFailed);
use_overlay = 0;
break;
}
use_overlay++;
}
mp_msg(MSGT_VO,MSGL_INFO, MSGTR_LIBVO_TDFXVID_OverlayReady,
src_width,src_stride,src_height,src_bpp,
dst_width,dst_stride,dst_height,dst_bpp);
break;
}
if(!use_overlay)
mp_msg(MSGT_VO,MSGL_INFO, MSGTR_LIBVO_TDFXVID_TextureBlitReady,
src_width,src_stride,src_height,src_bpp,
dst_width,dst_stride,dst_height,dst_bpp);
return 0;
}
static void
uninit(void)
{
if(use_overlay == 2) {
if(ioctl(tdfx_fd,TDFX_VID_OVERLAY_OFF))
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_OverlayOffFailed);
use_overlay--;
}
close(tdfx_fd);
tdfx_fd = -1;
}
static void check_events(void)
{
}
static int preinit(const char *arg)
{
tdfx_fd = open(arg ? arg : "/dev/tdfx_vid", O_RDWR);
if(tdfx_fd < 0) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_CantOpen,arg ? arg : "/dev/tdfx_vid",
strerror(errno));
return 1;
}
if(ioctl(tdfx_fd,TDFX_VID_GET_CONFIG,&tdfx_cfg)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_CantGetCurrentCfg,strerror(errno));
return 1;
}
mp_msg(MSGT_VO,MSGL_INFO, "tdfx_vid version %d\n"
" Ram: %d\n"
" Screen: %d x %d\n"
" Format: %c%c%c%d\n",
tdfx_cfg.version,
tdfx_cfg.ram_size,
tdfx_cfg.screen_width, tdfx_cfg.screen_height,
tdfx_cfg.screen_format>>24,(tdfx_cfg.screen_format>>16)&0xFF,
(tdfx_cfg.screen_format>>8)&0xFF,tdfx_cfg.screen_format&0xFF);
// For now just allocate more than i ever need
agp_mem = mmap( NULL, 1024*768*4, PROT_READ | PROT_WRITE, MAP_SHARED,
tdfx_fd, 0);
if(agp_mem == MAP_FAILED) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_MemmapFailed);
return 1;
}
memset(agp_mem,0,1024*768*4);
return 0;
}
static uint32_t get_image(mp_image_t *mpi) {
int buf = 0;
#ifdef VERBOSE
printf("Get image %d\n",buf);
#endif
// Currently read are too slow bcs we read from the
// agp aperture and not the memory directly
//if(mpi->flags&MP_IMGFLAG_READABLE) return VO_FALSE;
if(mpi->flags&MP_IMGFLAG_READABLE &&
(mpi->type==MP_IMGTYPE_IPB || mpi->type==MP_IMGTYPE_IP)){
// reference (I/P) frame of IP or IPB:
if(num_buffer<2) return VO_FALSE; // not enough
current_ip_buf^=1;
// for IPB with 2 buffers we can DR only one of the 2 P frames:
if(mpi->type==MP_IMGTYPE_IPB && num_buffer<3 && current_ip_buf) return VO_FALSE;
buf=current_ip_buf;
if(mpi->type==MP_IMGTYPE_IPB) ++buf; // preserve space for B
}
switch(mpi->imgfmt) {
case IMGFMT_YUY2:
case IMGFMT_UYVY:
case IMGFMT_BGR8:
case IMGFMT_BGR15:
case IMGFMT_BGR16:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
mpi->planes[0] = agp_mem + buf * buffer_size;
mpi->stride[0] = src_stride;
break;
case IMGFMT_YV12:
case IMGFMT_I420:
mpi->planes[0] = agp_mem + buf * buffer_size;
mpi->stride[0] = mpi->width;
mpi->planes[1] = mpi->planes[0] + mpi->stride[0]*mpi->height;
mpi->stride[1] = mpi->chroma_width;
mpi->planes[2] = mpi->planes[1] + mpi->stride[1]*mpi->chroma_height;
mpi->stride[2] = mpi->chroma_width;
break;
default:
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_GetImageTodo);
return VO_FALSE;
}
mpi->flags |= MP_IMGFLAG_DIRECT;
mpi->priv = (void*)buf;
return VO_TRUE;
}
static uint32_t start_slice(mp_image_t *mpi){
int buf = 0;
#ifdef VERBOSE
printf("Start slices %d\n",buf);
#endif
if(mpi->flags & MP_IMGFLAG_DIRECT)
buf = (int)mpi->priv;
current_buffer = buf;
return VO_TRUE;
}
static uint32_t draw_image(mp_image_t *mpi){
int buf = 0;
tdfx_vid_agp_move_t mov;
tdfx_vid_yuv_t yuv;
int p;
uint8_t* planes[3];
#ifdef VERBOSE
printf("Draw image %d\n",buf);
#endif
if(mpi->flags & MP_IMGFLAG_DIRECT)
buf = (int)mpi->priv;
switch(mpi->imgfmt) {
case IMGFMT_YUY2:
case IMGFMT_UYVY:
case IMGFMT_BGR8:
case IMGFMT_BGR15:
case IMGFMT_BGR16:
case IMGFMT_BGR24:
case IMGFMT_BGR32:
if(!(mpi->flags&(MP_IMGFLAG_DIRECT|MP_IMGFLAG_DRAW_CALLBACK))) {
// copy to agp_mem
#ifdef VERBOSE
printf("Memcpy\n");
#endif
planes[0] = agp_mem + buf * buffer_size;
mem2agpcpy_pic(planes[0],mpi->planes[0],src_bpp*mpi->width,mpi->height,
buffer_stride[0],mpi->stride[0]);
} else
planes[0] = agp_mem + buf * buffer_size;
mov.move2 = TDFX_VID_MOVE_2_PACKED;
mov.width = mpi->width*((mpi->bpp+7)/8);
mov.height = mpi->height;
mov.src = planes[0] - agp_mem;
mov.src_stride = buffer_stride[0];
mov.dst = back_buffer;
mov.dst_stride = src_stride;
if(ioctl(tdfx_fd,TDFX_VID_AGP_MOVE,&mov))
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_AgpMoveFailed);
break;
case IMGFMT_YV12:
case IMGFMT_I420:
if(!(mpi->flags&(MP_IMGFLAG_DIRECT|MP_IMGFLAG_DRAW_CALLBACK))) {
// Copy to agp mem
#ifdef VERBOSE
printf("Memcpy\n");
#endif
planes[0] = agp_mem + buf * buffer_size;
memcpy_pic(planes[0],mpi->planes[0],mpi->width,mpi->height,
buffer_stride[0],mpi->stride[0]);
planes[1] = planes[0] + (mpi->height*mpi->stride[0]);
memcpy_pic(planes[1],mpi->planes[1],mpi->chroma_width,mpi->chroma_height,
buffer_stride[1],mpi->stride[1]);
planes[2] = planes[1] + (mpi->chroma_height*mpi->stride[1]);
memcpy_pic(planes[2],mpi->planes[2],mpi->chroma_width,mpi->chroma_height,
buffer_stride[2],mpi->stride[2]);
} else {
planes[0] = agp_mem + buf * buffer_size;
planes[1] = planes[0] + buffer_stride[0] * src_height;
planes[2] = planes[1] + buffer_stride[1] * src_height/2;
}
// Setup the yuv thing
yuv.base = back_buffer;
yuv.stride = src_stride;
if(ioctl(tdfx_fd,TDFX_VID_SET_YUV,&yuv)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_SetYuvFailed);
break;
}
// Now agp move that
// Y
mov.move2 = TDFX_VID_MOVE_2_YUV;
mov.width = mpi->width;
mov.height = mpi->height;
mov.src = planes[0] - agp_mem;
mov.src_stride = buffer_stride[0];
mov.dst = 0x0;
mov.dst_stride = TDFX_VID_YUV_STRIDE;
if(ioctl(tdfx_fd,TDFX_VID_AGP_MOVE,&mov)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_AgpMoveFailedOnYPlane);
break;
}
//return 0;
// U
p = mpi->imgfmt == IMGFMT_YV12 ? 1 : 2;
mov.width = mpi->chroma_width;
mov.height = mpi->chroma_height;
mov.src = planes[p] - agp_mem;
mov.src_stride = buffer_stride[p];
mov.dst += TDFX_VID_YUV_PLANE_SIZE;
if(ioctl(tdfx_fd,TDFX_VID_AGP_MOVE,&mov)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_AgpMoveFailedOnUPlane);
break;
}
// V
p = mpi->imgfmt == IMGFMT_YV12 ? 2 : 1;
mov.src = planes[p] - agp_mem;
mov.src_stride = buffer_stride[p];
mov.dst += TDFX_VID_YUV_PLANE_SIZE;
if(ioctl(tdfx_fd,TDFX_VID_AGP_MOVE,&mov)) {
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_AgpMoveFailedOnVPlane);
break;
}
break;
default:
mp_msg(MSGT_VO,MSGL_WARN, MSGTR_LIBVO_TDFXVID_UnknownFormat,mpi->imgfmt);
return VO_TRUE;
}
return VO_TRUE;
}
static uint32_t fullscreen(void) {
vo_fs ^= 1;
aspect(&dst_width,&dst_height,vo_fs ? A_ZOOM : A_NOZOOM);
// This does not work :((
//clear_screen();
return VO_TRUE;
}
static uint32_t set_window(mp_win_t* w) {
if(!use_overlay) return VO_FALSE;
tdfx_ov.dst_x = w->x;
tdfx_ov.dst_y = w->y;
tdfx_ov.dst_width = w->w;
tdfx_ov.dst_height = w->h;
if(ioctl(tdfx_fd,TDFX_VID_SET_OVERLAY,&tdfx_ov))
mp_msg(MSGT_VO, MSGL_V, "tdfx_vid: set window failed\n");
return VO_TRUE;
}
static uint32_t set_colorkey(mp_colorkey_t* colork) {
if(!use_overlay) return VO_FALSE;
tdfx_ov.colorkey[0] = tdfx_ov.colorkey[1] = colork->x11;
tdfx_ov.use_colorkey = 1;
tdfx_ov.invert_colorkey = 0;
if(ioctl(tdfx_fd,TDFX_VID_SET_OVERLAY,&tdfx_ov))
mp_msg(MSGT_VO, MSGL_V, "tdfx_vid: set colorkey failed\n");
return VO_TRUE;
}
static int control(uint32_t request, void *data, ...)
{
switch (request) {
case VOCTRL_QUERY_FORMAT:
return query_format(*((uint32_t*)data));
case VOCTRL_GET_IMAGE:
return get_image(data);
case VOCTRL_DRAW_IMAGE:
return draw_image(data);
case VOCTRL_START_SLICE:
return start_slice(data);
case VOCTRL_FULLSCREEN:
return fullscreen();
case VOCTRL_XOVERLAY_SUPPORT:
return VO_TRUE;
case VOCTRL_XOVERLAY_SET_COLORKEY:
return set_colorkey(data);
case VOCTRL_XOVERLAY_SET_WIN:
return set_window(data);
}
return VO_NOTIMPL;
}