/* Written by Rudolf Cornelissen 05/2002-4/2004 */ /* Note on 'missing features' in BeOS 5.0.3 and DANO: * BeOS needs to define more colorspaces! It would be nice if BeOS would support the FourCC 'definitions' * of colorspaces. These colorspaces are 32bit words, so it could be simply done (or is it already so?) */ #define MODULE_BIT 0x00000400 #include "acc_std.h" /* define the supported overlay input colorspaces */ /* It would be nice to have the YUV4:2:0 2-plane mode implemented also later on, but the Be colorspace * definitions (in GraphicsDefs.h, R5.0.3 and DANO5.1d0) do not include this one... */ static uint32 overlay_colorspaces [] = { (uint32)B_YCbCr422, (uint32)B_NO_COLOR_SPACE }; uint32 OVERLAY_COUNT(const display_mode *dm) // This method is never used AFAIK though it *is* exported on R5.0.3 and DANO. // Does someone know howto invoke it? { LOG(4,("Overlay: count called\n")); /* check for NULL pointer */ if (dm == NULL) { LOG(4,("Overlay: No display mode specified!\n")); } /* apparantly overlay count should report the number of 'overlay units' on the card */ return 1; } const uint32 *OVERLAY_SUPPORTED_SPACES(const display_mode *dm) // This method is never used AFAIK though it *is* exported on R5.0.3 and DANO. // Does someone know howto invoke it? { LOG(4,("Overlay: supported_spaces called.\n")); /* check for NULL pointer */ if (dm == NULL) { LOG(4,("Overlay: No display mode specified!\n")); return NULL; } /* assuming interlaced VGA is not supported */ if (dm->timing.flags && B_TIMING_INTERLACED) { return NULL; } /* return a B_NO_COLOR_SPACE terminated list */ return &overlay_colorspaces[0]; } uint32 OVERLAY_SUPPORTED_FEATURES(uint32 a_color_space) // This method is never used AFAIK. On R5.0.3 and DANO it is not even exported! { LOG(4,("Overlay: supported_features: color_space $%08x\n",a_color_space)); /* check what features are supported for the current overlaybitmap colorspace */ switch (a_color_space) { default: return ( B_OVERLAY_KEYING_USES_ALPHA | B_OVERLAY_COLOR_KEY | B_OVERLAY_HORIZONTAL_FILTERING | B_OVERLAY_VERTICAL_FILTERING ); } } const overlay_buffer *ALLOCATE_OVERLAY_BUFFER(color_space cs, uint16 width, uint16 height) { int offset = 0; /* used to determine next buffer to create */ uint32 adress, adress2, temp32; /* used to calculate buffer adresses */ uint32 oldsize = 0; /* used to 'squeeze' new buffers between already existing ones */ int cnt; /* loopcounter */ /* acquire the shared benaphore */ AQUIRE_BEN(si->overlay.lock) LOG(4,("Overlay: cardRAM_start = $%08x\n",(uint32)((uint8*)si->framebuffer))); LOG(4,("Overlay: cardRAM_start_DMA = $%08x\n",(uint32)((uint8*)si->framebuffer_pci))); LOG(4,("Overlay: cardRAM_size = %dMb\n",si->ps.memory_size)); /* find first empty slot (room for another buffer?) */ for (offset = 0; offset < MAXBUFFERS; offset++) { if (si->overlay.myBuffer[offset].buffer == NULL) break; } LOG(4,("Overlay: Allocate_buffer offset = %d\n",offset)); if (offset < MAXBUFFERS) /* setup new scaler input buffer */ { switch (cs) { case B_YCbCr422: if (si->ps.card_arch < NV10A) { /* check if slopspace is needed: RIVA128 and TNT need ~0x000f. */ si->overlay.myBuffer[offset].width = ((width + 0x000f) & ~0x000f); } else { /* check if slopspace is needed: GeForce need ~0x001f. */ /* fixme: * update needed for GF DVDmax support to adhere to CRTC2 constraints?? */ si->overlay.myBuffer[offset].width = ((width + 0x001f) & ~0x001f); } si->overlay.myBuffer[offset].bytes_per_row = 2 * si->overlay.myBuffer[offset].width; /* check if the requested horizontal pitch is supported: */ //fixme: tune for GF and TNT... if (si->overlay.myBuffer[offset].width > 4088) { LOG(4,("Overlay: Sorry, requested buffer pitch not supported, aborted\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } break; default: /* unsupported colorspace! */ LOG(4,("Overlay: Sorry, colorspace $%08x not supported, aborted\n",cs)); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; break; } /* check if the requested buffer width is supported */ if (si->overlay.myBuffer[offset].width > 1024) { LOG(4,("Overlay: Sorry, requested buffer width not supported, aborted\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } /* check if the requested buffer height is supported */ if (height > 1024) { LOG(4,("Overlay: Sorry, requested buffer height not supported, aborted\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } /* store slopspace (in pixels) for each bitmap for use by 'overlay unit' (BES) */ si->overlay.myBufInfo[offset].slopspace = si->overlay.myBuffer[offset].width - width; si->overlay.myBuffer[offset].space = cs; si->overlay.myBuffer[offset].height = height; /* we define the overlay buffers to reside 'in the back' of the cards RAM */ /* NOTE to app programmers: * Beware that an app using overlay needs to track workspace switches and screenprefs * changes. If such an action is detected, the app needs to reset it's pointers to the * newly created overlay bitmaps, which will be assigned by BeOS automatically after such * an event. (Also the app needs to respect the new overlay_constraints that will be applicable!) * * It is entirely possible that new bitmaps may *not* be re-setup at all, or less of them * than previously setup by the app might be re-setup. This is due to cardRAM restraints then. * This means that the app should also check for NULL pointers returned by the bitmaps, * and if this happens, it needs to fallback to single buffered overlay or even fallback to * bitmap output for the new situation. */ /* Another NOTE for app programmers: * A *positive* side-effect of assigning the first overlay buffer exactly at the end of the * cardRAM is that apps that try to write beyond the buffer's space get a segfault immediately. * This *greatly* simplifies tracking such errors! * Of course such errors may lead to strange effects in the app or driver behaviour if they are * not hunted down and removed.. */ /* calculate first free RAM adress in card: * Driver setup is as follows: * card base: - hardware cursor bitmap (if used), * directly above - screen memory for both heads */ adress2 = (((uint32)((uint8*)si->fbc.frame_buffer)) + /* cursor already included here */ (si->fbc.bytes_per_row * si->dm.virtual_height)); /* size in bytes of screen(s) */ LOG(4,("Overlay: first free cardRAM virtual adress $%08x\n", adress2)); /* calculate 'preliminary' buffer size including slopspace */ oldsize = si->overlay.myBufInfo[offset].size; si->overlay.myBufInfo[offset].size = si->overlay.myBuffer[offset].bytes_per_row * si->overlay.myBuffer[offset].height; /* calculate virtual memory adress that would be needed for a new bitmap */ /* NOTE to app programmers: * For testing app behaviour regarding workspace switches or screen prefs changes to settings * that do not have enough cardRAM left for allocation of overlay bitmaps, you need a card with * a low amount of RAM. Or you can set in the file nv.settings for example: * memory 8 #8Mb RAM on card * and reboot (this simulates 8Mb RAM on the card). * * If you switch now to settings: 1600x1200x32bit (single head) the app needs to fallback to * bitmap output or maybe single buffered overlay output if small bitmaps are used. */ adress = (((uint32)((uint8*)si->framebuffer)) + (si->ps.memory_size * 1024 * 1024)); for (cnt = 0; cnt <= offset; cnt++) { adress -= si->overlay.myBufInfo[cnt].size; } /* the > G200 scalers require buffers to be aligned to 16 byte pages cardRAM offset, G200 can do with * 8 byte pages cardRAM offset. Compatible settings used, has no real downside consequences here */ /* Check if we need to modify the buffers starting adress and thus the size */ /* calculate 'would be' cardRAM offset */ temp32 = (adress - ((uint32)((vuint32 *)si->framebuffer))); /* check if it is aligned */ if (temp32 != (temp32 & 0xfffffff0)) { /* update the (already calculated) buffersize to get it aligned */ si->overlay.myBufInfo[offset].size += (temp32 - (temp32 & 0xfffffff0)); /* update the (already calculated) adress to get it aligned */ adress -= (temp32 - (temp32 & 0xfffffff0)); } LOG(4,("Overlay: new buffer needs virtual adress $%08x\n", adress)); /* First check now if buffer to be defined is 'last one' in memory (speaking backwards): * this is done to prevent a large buffer getting created in the space a small buffer * occupied earlier, if not all buffers created were deleted. * Note also that the app can delete the buffers in any order desired. */ /* NOTE to app programmers: * If you are going to delete a overlay buffer you created, you should delete them *all* and * then re-create only the new ones needed. This way you are sure not to get unused memory- * space in between your overlay buffers for instance, so cardRAM is used 'to the max'. * If you don't, you might not get a buffer at all if you are trying to set up a larger one * than before. * (Indeed: not all buffers *have* to be of the same type and size...) */ for (cnt = offset; cnt < MAXBUFFERS; cnt++) { if (si->overlay.myBuffer[cnt].buffer != NULL) { /* Check if the new buffer would fit into the space the single old one used here */ if (si->overlay.myBufInfo[offset].size <= oldsize) { /* It does, so we reset to the old size and adresses to prevent the space from shrinking * if we get here again... */ adress -= (oldsize - si->overlay.myBufInfo[offset].size); si->overlay.myBufInfo[offset].size = oldsize; LOG(4,("Overlay: 'squeezing' in buffer:\n" "Overlay: resetting it to virtual adress $%08x and size $%08x\n", adress,oldsize)); /* force exiting the FOR loop */ cnt = MAXBUFFERS; } else { /* nogo, sorry */ LOG(4,("Overlay: Other buffer(s) exist after this one:\n" "Overlay: not enough space to 'squeeze' this one in, aborted\n")); /* Reset to the old size to prevent the space from 'growing' if we get here again... */ si->overlay.myBufInfo[offset].size = oldsize; /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } } } /* check if we have enough space to setup this new bitmap * (preventing overlap of desktop RAMspace & overlay bitmap RAMspace here) */ if (adress < adress2) /* nope, sorry */ { LOG(4,("Overlay: Sorry, no more space for buffers: aborted\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } /* continue buffer setup */ si->overlay.myBuffer[offset].buffer = (void *) adress; /* calculate physical memory adress (for dma use) */ adress = (((uint32)((uint8*)si->framebuffer_pci)) + (si->ps.memory_size * 1024 * 1024)); for (cnt = 0; cnt <= offset; cnt++) { adress -= si->overlay.myBufInfo[cnt].size; } /* this adress is already aligned to the scaler's requirements (via the already modified sizes) */ si->overlay.myBuffer[offset].buffer_dma = (void *) adress; LOG(4,("Overlay: New buffer: addr $%08x, dma_addr $%08x, color space $%08x\n", (uint32)((uint8*)si->overlay.myBuffer[offset].buffer), (uint32)((uint8*)si->overlay.myBuffer[offset].buffer_dma), cs)); LOG(4,("Overlay: New buffer's size is $%08x\n", si->overlay.myBufInfo[offset].size)); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return &si->overlay.myBuffer[offset]; } else /* sorry, no more room for buffers */ { LOG(4,("Overlay: Sorry, no more space for buffers: aborted\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } } status_t RELEASE_OVERLAY_BUFFER(const overlay_buffer *ob) /* Note that the user can delete the buffers in any order desired! */ { int offset = 0; if (ob != NULL) { /* find the buffer */ for (offset = 0; offset < MAXBUFFERS; offset++) { if (si->overlay.myBuffer[offset].buffer == ob->buffer) break; } if (offset < MAXBUFFERS) /* delete current buffer */ { si->overlay.myBuffer[offset].buffer = NULL; si->overlay.myBuffer[offset].buffer_dma = NULL; LOG(4,("Overlay: Release_buffer offset = %d, buffer released\n",offset)); return B_OK; } else { /* this is no buffer of ours! */ LOG(4,("Overlay: Release_overlay_buffer: not ours, aborted!\n")); return B_ERROR; } } else /* no buffer specified! */ { LOG(4,("Overlay: Release_overlay_buffer: no buffer specified, aborted!\n")); return B_ERROR; } } status_t GET_OVERLAY_CONSTRAINTS (const display_mode *dm, const overlay_buffer *ob, overlay_constraints *oc) { int offset = 0; LOG(4,("Overlay: Get_overlay_constraints called\n")); /* check for NULL pointers */ if ((dm == NULL) || (ob == NULL) || (oc == NULL)) { LOG(4,("Overlay: Get_overlay_constraints: Null pointer(s) detected!\n")); return B_ERROR; } /* find the buffer */ for (offset = 0; offset < MAXBUFFERS; offset++) { if (si->overlay.myBuffer[offset].buffer == ob->buffer) break; } if (offset < MAXBUFFERS) { /* scaler input (values are in pixels) */ oc->view.h_alignment = 0; oc->view.v_alignment = 0; switch (ob->space) { case B_YCbCr422: if (si->ps.card_arch < NV10A) { /* RIVA128 and TNT need 15. * Note: this has to be in sync with the slopspace setup during buffer allocation.. */ oc->view.width_alignment = 15; } else { /* GeForce need 31. * Note: this has to be in sync with the slopspace setup during buffer allocation.. */ oc->view.width_alignment = 31; } break; default: /* we should not be here, but set the worst-case value just to be safe anyway */ oc->view.width_alignment = 31; break; } oc->view.height_alignment = 0; oc->view.width.min = 1; oc->view.height.min = 2; /* two fields */ oc->view.width.max = ob->width; oc->view.height.max = ob->height; /* scaler output restrictions */ oc->window.h_alignment = 0; oc->window.v_alignment = 0; oc->window.width_alignment = 0; oc->window.height_alignment = 0; oc->window.width.min = 2; /* GeForce cards can output upto and including 2046 pixels in width */ //fixme: how about TNT? if (dm->virtual_width > 2046) { oc->window.width.max = 2046; } else { oc->window.width.max = dm->virtual_width; } oc->window.height.min = 2; /* GeForce cards can output upto and including 2046 pixels in height */ //fixme: how about TNT? if (dm->virtual_height > 2046) { oc->window.height.max = 2046; } else { oc->window.height.max = dm->virtual_height; } /* GeForce scaling restrictions */ switch (si->ps.card_arch) { case NV04A: /* Riva128-TNT2 series have an old BES engine... */ oc->h_scale.min = 1.0; oc->v_scale.min = 1.0; break; case NV30A: /* GeForceFX series have a new BES engine... */ oc->h_scale.min = 0.5; oc->v_scale.min = 0.5; /* NV31 (confirmed GeForceFX 5600) has NV20A scaling limits! * So let it fall through... */ if (si->ps.card_type != NV31) break; default: /* the rest in between... */ oc->h_scale.min = 0.125; oc->v_scale.min = 0.125; break; } /* all cards have a upscaling limit of 8.0 (see official nVidia specsheets) */ oc->h_scale.max = 8.0; oc->v_scale.max = 8.0; return B_OK; } else { /* this is no buffer of ours! */ LOG(4,("Overlay: Get_overlay_constraints: buffer is not ours, aborted!\n")); return B_ERROR; } } overlay_token ALLOCATE_OVERLAY(void) { uint32 tmpToken; LOG(4,("Overlay: Allocate_overlay called: ")); /* come up with a token */ tmpToken = 0x12345678; /* acquire the shared benaphore */ AQUIRE_BEN(si->overlay.lock) /* overlay unit already in use? */ if (si->overlay.myToken == NULL) /* overlay unit is available */ { LOG(4,("succesfull\n")); si->overlay.myToken = &tmpToken; /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return si->overlay.myToken; } else /* sorry, overlay unit is occupied */ { LOG(4,("failed: already in use!\n")); /* release the shared benaphore */ RELEASE_BEN(si->overlay.lock) return NULL; } } status_t RELEASE_OVERLAY(overlay_token ot) { LOG(4,("Overlay: Release_overlay called: ")); /* is this call for real? */ if ((ot == NULL) || (si->overlay.myToken == NULL) || (ot != si->overlay.myToken)) /* nope, abort */ { LOG(4,("failed, not in use!\n")); return B_ERROR; } else /* call is for real */ { nv_release_bes(); LOG(4,("succesfull\n")); si->overlay.myToken = NULL; return B_OK; } } status_t CONFIGURE_OVERLAY (overlay_token ot, const overlay_buffer *ob, const overlay_window *ow, const overlay_view *ov) { int offset = 0; /* used for buffer index */ LOG(4,("Overlay: Configure_overlay called: ")); /* Note: * When a Workspace switch, screen prefs change, or overlay app shutdown occurs, BeOS will * release all overlay buffers. The buffer currently displayed at that moment, may need some * 'hardware releasing' in the CONFIGURE_OVERLAY routine. This is why CONFIGURE_OVERLAY gets * called one more time then, with a null pointer for overlay_window and overlay_view, while * the currently displayed overlay_buffer is given. * The G200-G550 do not need to do anything on such an occasion, so we simply return if we * get called then. */ if ((ow == NULL) || (ov == NULL)) { LOG(4,("output properties changed\n")); return B_OK; } /* Note: * If during overlay use the screen prefs are changed, or the workspace has changed, it * may be that we were not able to re-allocate the requested overlay buffers (or only partly) * due to lack of cardRAM. If the app does not respond properly to this, we might end up * with a NULL pointer instead of a overlay_buffer to work with here. * Of course, we need to abort then to prevent the system from 'going down'. * The app will probably crash because it will want to write into this non-existant buffer * at some point. */ if (ob == NULL) { LOG(4,("no overlay buffer specified\n")); return B_ERROR; } /* is this call done by the app that owns us? */ if ((ot == NULL) || (si->overlay.myToken == NULL) || (ot != si->overlay.myToken)) /* nope, abort */ { LOG(4,("failed\n")); return B_ERROR; } else /* call is for real */ { /* find the buffer's offset */ for (offset = 0; offset < MAXBUFFERS; offset++) { if (si->overlay.myBuffer[offset].buffer == ob->buffer) break; } if (offset < MAXBUFFERS) { LOG(4,("succesfull, switching to buffer %d\n", offset)); /* do 'overlay follow head' in dualhead modes on dualhead cards */ if (si->ps.secondary_head) { switch (si->dm.flags & DUALHEAD_BITS) { case DUALHEAD_ON: case DUALHEAD_SWITCH: if ((ow->h_start + (ow->width / 2)) < (si->dm.h_display_start + si->dm.timing.h_display)) nv_bes_to_crtc(si->crtc_switch_mode); else nv_bes_to_crtc(!si->crtc_switch_mode); break; default: nv_bes_to_crtc(si->crtc_switch_mode); break; } } /* _now_ program overlay hardware */ nv_configure_bes(ob, ow, ov, offset); return B_OK; } else { /* this is no buffer of ours! */ LOG(4,("buffer is not ours, aborted!\n")); return B_ERROR; } } }