0,0 → 1,458 |
/* |
* Copyright 2008 Advanced Micro Devices, Inc. |
* Copyright 2008 Red Hat Inc. |
* Copyright 2009 Jerome Glisse. |
* |
* Permission is hereby granted, free of charge, to any person obtaining a |
* copy of this software and associated documentation files (the "Software"), |
* to deal in the Software without restriction, including without limitation |
* the rights to use, copy, modify, merge, publish, distribute, sublicense, |
* and/or sell copies of the Software, and to permit persons to whom the |
* Software is furnished to do so, subject to the following conditions: |
* |
* The above copyright notice and this permission notice shall be included in |
* all copies or substantial portions of the Software. |
* |
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
* THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
* OTHER DEALINGS IN THE SOFTWARE. |
* |
* Authors: Dave Airlie |
* Alex Deucher |
* Jerome Glisse |
*/ |
#include "drmP.h" |
#include "drm.h" |
#include "radeon_drm.h" |
#include "radeon_reg.h" |
#include "radeon.h" |
|
#include "r200_reg_safe.h" |
|
//#include "r100_track.h" |
|
#if 0 |
static int r200_get_vtx_size_0(uint32_t vtx_fmt_0) |
{ |
int vtx_size, i; |
vtx_size = 2; |
|
if (vtx_fmt_0 & R200_VTX_Z0) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_W0) |
vtx_size++; |
/* blend weight */ |
if (vtx_fmt_0 & (0x7 << R200_VTX_WEIGHT_COUNT_SHIFT)) |
vtx_size += (vtx_fmt_0 >> R200_VTX_WEIGHT_COUNT_SHIFT) & 0x7; |
if (vtx_fmt_0 & R200_VTX_PV_MATRIX_SEL) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_N0) |
vtx_size += 3; |
if (vtx_fmt_0 & R200_VTX_POINT_SIZE) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_DISCRETE_FOG) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_SHININESS_0) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_SHININESS_1) |
vtx_size++; |
for (i = 0; i < 8; i++) { |
int color_size = (vtx_fmt_0 >> (11 + 2*i)) & 0x3; |
switch (color_size) { |
case 0: break; |
case 1: vtx_size++; break; |
case 2: vtx_size += 3; break; |
case 3: vtx_size += 4; break; |
} |
} |
if (vtx_fmt_0 & R200_VTX_XY1) |
vtx_size += 2; |
if (vtx_fmt_0 & R200_VTX_Z1) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_W1) |
vtx_size++; |
if (vtx_fmt_0 & R200_VTX_N1) |
vtx_size += 3; |
return vtx_size; |
} |
|
static int r200_get_vtx_size_1(uint32_t vtx_fmt_1) |
{ |
int vtx_size, i, tex_size; |
vtx_size = 0; |
for (i = 0; i < 6; i++) { |
tex_size = (vtx_fmt_1 >> (i * 3)) & 0x7; |
if (tex_size > 4) |
continue; |
vtx_size += tex_size; |
} |
return vtx_size; |
} |
|
int r200_packet0_check(struct radeon_cs_parser *p, |
struct radeon_cs_packet *pkt, |
unsigned idx, unsigned reg) |
{ |
struct radeon_cs_chunk *ib_chunk; |
struct radeon_cs_reloc *reloc; |
struct r100_cs_track *track; |
volatile uint32_t *ib; |
uint32_t tmp; |
int r; |
int i; |
int face; |
u32 tile_flags = 0; |
|
ib = p->ib->ptr; |
ib_chunk = &p->chunks[p->chunk_ib_idx]; |
track = (struct r100_cs_track *)p->track; |
|
switch (reg) { |
case RADEON_CRTC_GUI_TRIG_VLINE: |
r = r100_cs_packet_parse_vline(p); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
break; |
/* FIXME: only allow PACKET3 blit? easier to check for out of |
* range access */ |
case RADEON_DST_PITCH_OFFSET: |
case RADEON_SRC_PITCH_OFFSET: |
r = r100_reloc_pitch_offset(p, pkt, idx, reg); |
if (r) |
return r; |
break; |
case RADEON_RB3D_DEPTHOFFSET: |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
track->zb.robj = reloc->robj; |
track->zb.offset = ib_chunk->kdata[idx]; |
ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); |
break; |
case RADEON_RB3D_COLOROFFSET: |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
track->cb[0].robj = reloc->robj; |
track->cb[0].offset = ib_chunk->kdata[idx]; |
ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); |
break; |
case R200_PP_TXOFFSET_0: |
case R200_PP_TXOFFSET_1: |
case R200_PP_TXOFFSET_2: |
case R200_PP_TXOFFSET_3: |
case R200_PP_TXOFFSET_4: |
case R200_PP_TXOFFSET_5: |
i = (reg - R200_PP_TXOFFSET_0) / 24; |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); |
track->textures[i].robj = reloc->robj; |
break; |
case R200_PP_CUBIC_OFFSET_F1_0: |
case R200_PP_CUBIC_OFFSET_F2_0: |
case R200_PP_CUBIC_OFFSET_F3_0: |
case R200_PP_CUBIC_OFFSET_F4_0: |
case R200_PP_CUBIC_OFFSET_F5_0: |
case R200_PP_CUBIC_OFFSET_F1_1: |
case R200_PP_CUBIC_OFFSET_F2_1: |
case R200_PP_CUBIC_OFFSET_F3_1: |
case R200_PP_CUBIC_OFFSET_F4_1: |
case R200_PP_CUBIC_OFFSET_F5_1: |
case R200_PP_CUBIC_OFFSET_F1_2: |
case R200_PP_CUBIC_OFFSET_F2_2: |
case R200_PP_CUBIC_OFFSET_F3_2: |
case R200_PP_CUBIC_OFFSET_F4_2: |
case R200_PP_CUBIC_OFFSET_F5_2: |
case R200_PP_CUBIC_OFFSET_F1_3: |
case R200_PP_CUBIC_OFFSET_F2_3: |
case R200_PP_CUBIC_OFFSET_F3_3: |
case R200_PP_CUBIC_OFFSET_F4_3: |
case R200_PP_CUBIC_OFFSET_F5_3: |
case R200_PP_CUBIC_OFFSET_F1_4: |
case R200_PP_CUBIC_OFFSET_F2_4: |
case R200_PP_CUBIC_OFFSET_F3_4: |
case R200_PP_CUBIC_OFFSET_F4_4: |
case R200_PP_CUBIC_OFFSET_F5_4: |
case R200_PP_CUBIC_OFFSET_F1_5: |
case R200_PP_CUBIC_OFFSET_F2_5: |
case R200_PP_CUBIC_OFFSET_F3_5: |
case R200_PP_CUBIC_OFFSET_F4_5: |
case R200_PP_CUBIC_OFFSET_F5_5: |
i = (reg - R200_PP_TXOFFSET_0) / 24; |
face = (reg - ((i * 24) + R200_PP_TXOFFSET_0)) / 4; |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
track->textures[i].cube_info[face - 1].offset = ib_chunk->kdata[idx]; |
ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); |
track->textures[i].cube_info[face - 1].robj = reloc->robj; |
break; |
case RADEON_RE_WIDTH_HEIGHT: |
track->maxy = ((ib_chunk->kdata[idx] >> 16) & 0x7FF); |
break; |
case RADEON_RB3D_COLORPITCH: |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
|
if (reloc->lobj.tiling_flags & RADEON_TILING_MACRO) |
tile_flags |= RADEON_COLOR_TILE_ENABLE; |
if (reloc->lobj.tiling_flags & RADEON_TILING_MICRO) |
tile_flags |= RADEON_COLOR_MICROTILE_ENABLE; |
|
tmp = ib_chunk->kdata[idx] & ~(0x7 << 16); |
tmp |= tile_flags; |
ib[idx] = tmp; |
|
track->cb[0].pitch = ib_chunk->kdata[idx] & RADEON_COLORPITCH_MASK; |
break; |
case RADEON_RB3D_DEPTHPITCH: |
track->zb.pitch = ib_chunk->kdata[idx] & RADEON_DEPTHPITCH_MASK; |
break; |
case RADEON_RB3D_CNTL: |
switch ((ib_chunk->kdata[idx] >> RADEON_RB3D_COLOR_FORMAT_SHIFT) & 0x1f) { |
case 7: |
case 8: |
case 9: |
case 11: |
case 12: |
track->cb[0].cpp = 1; |
break; |
case 3: |
case 4: |
case 15: |
track->cb[0].cpp = 2; |
break; |
case 6: |
track->cb[0].cpp = 4; |
break; |
default: |
DRM_ERROR("Invalid color buffer format (%d) !\n", |
((ib_chunk->kdata[idx] >> RADEON_RB3D_COLOR_FORMAT_SHIFT) & 0x1f)); |
return -EINVAL; |
} |
if (ib_chunk->kdata[idx] & RADEON_DEPTHXY_OFFSET_ENABLE) { |
DRM_ERROR("No support for depth xy offset in kms\n"); |
return -EINVAL; |
} |
|
track->z_enabled = !!(ib_chunk->kdata[idx] & RADEON_Z_ENABLE); |
break; |
case RADEON_RB3D_ZSTENCILCNTL: |
switch (ib_chunk->kdata[idx] & 0xf) { |
case 0: |
track->zb.cpp = 2; |
break; |
case 2: |
case 3: |
case 4: |
case 5: |
case 9: |
case 11: |
track->zb.cpp = 4; |
break; |
default: |
break; |
} |
break; |
case RADEON_RB3D_ZPASS_ADDR: |
r = r100_cs_packet_next_reloc(p, &reloc); |
if (r) { |
DRM_ERROR("No reloc for ib[%d]=0x%04X\n", |
idx, reg); |
r100_cs_dump_packet(p, pkt); |
return r; |
} |
ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); |
break; |
case RADEON_PP_CNTL: |
{ |
uint32_t temp = ib_chunk->kdata[idx] >> 4; |
for (i = 0; i < track->num_texture; i++) |
track->textures[i].enabled = !!(temp & (1 << i)); |
} |
break; |
case RADEON_SE_VF_CNTL: |
track->vap_vf_cntl = ib_chunk->kdata[idx]; |
break; |
case 0x210c: |
/* VAP_VF_MAX_VTX_INDX */ |
track->max_indx = ib_chunk->kdata[idx] & 0x00FFFFFFUL; |
break; |
case R200_SE_VTX_FMT_0: |
track->vtx_size = r200_get_vtx_size_0(ib_chunk->kdata[idx]); |
break; |
case R200_SE_VTX_FMT_1: |
track->vtx_size += r200_get_vtx_size_1(ib_chunk->kdata[idx]); |
break; |
case R200_PP_TXSIZE_0: |
case R200_PP_TXSIZE_1: |
case R200_PP_TXSIZE_2: |
case R200_PP_TXSIZE_3: |
case R200_PP_TXSIZE_4: |
case R200_PP_TXSIZE_5: |
i = (reg - R200_PP_TXSIZE_0) / 32; |
track->textures[i].width = (ib_chunk->kdata[idx] & RADEON_TEX_USIZE_MASK) + 1; |
track->textures[i].height = ((ib_chunk->kdata[idx] & RADEON_TEX_VSIZE_MASK) >> RADEON_TEX_VSIZE_SHIFT) + 1; |
break; |
case R200_PP_TXPITCH_0: |
case R200_PP_TXPITCH_1: |
case R200_PP_TXPITCH_2: |
case R200_PP_TXPITCH_3: |
case R200_PP_TXPITCH_4: |
case R200_PP_TXPITCH_5: |
i = (reg - R200_PP_TXPITCH_0) / 32; |
track->textures[i].pitch = ib_chunk->kdata[idx] + 32; |
break; |
case R200_PP_TXFILTER_0: |
case R200_PP_TXFILTER_1: |
case R200_PP_TXFILTER_2: |
case R200_PP_TXFILTER_3: |
case R200_PP_TXFILTER_4: |
case R200_PP_TXFILTER_5: |
i = (reg - R200_PP_TXFILTER_0) / 32; |
track->textures[i].num_levels = ((ib_chunk->kdata[idx] & R200_MAX_MIP_LEVEL_MASK) |
>> R200_MAX_MIP_LEVEL_SHIFT); |
tmp = (ib_chunk->kdata[idx] >> 23) & 0x7; |
if (tmp == 2 || tmp == 6) |
track->textures[i].roundup_w = false; |
tmp = (ib_chunk->kdata[idx] >> 27) & 0x7; |
if (tmp == 2 || tmp == 6) |
track->textures[i].roundup_h = false; |
break; |
case R200_PP_TXMULTI_CTL_0: |
case R200_PP_TXMULTI_CTL_1: |
case R200_PP_TXMULTI_CTL_2: |
case R200_PP_TXMULTI_CTL_3: |
case R200_PP_TXMULTI_CTL_4: |
case R200_PP_TXMULTI_CTL_5: |
i = (reg - R200_PP_TXMULTI_CTL_0) / 32; |
break; |
case R200_PP_TXFORMAT_X_0: |
case R200_PP_TXFORMAT_X_1: |
case R200_PP_TXFORMAT_X_2: |
case R200_PP_TXFORMAT_X_3: |
case R200_PP_TXFORMAT_X_4: |
case R200_PP_TXFORMAT_X_5: |
i = (reg - R200_PP_TXFORMAT_X_0) / 32; |
track->textures[i].txdepth = ib_chunk->kdata[idx] & 0x7; |
tmp = (ib_chunk->kdata[idx] >> 16) & 0x3; |
/* 2D, 3D, CUBE */ |
switch (tmp) { |
case 0: |
case 5: |
case 6: |
case 7: |
track->textures[i].tex_coord_type = 0; |
break; |
case 1: |
track->textures[i].tex_coord_type = 1; |
break; |
case 2: |
track->textures[i].tex_coord_type = 2; |
break; |
} |
break; |
case R200_PP_TXFORMAT_0: |
case R200_PP_TXFORMAT_1: |
case R200_PP_TXFORMAT_2: |
case R200_PP_TXFORMAT_3: |
case R200_PP_TXFORMAT_4: |
case R200_PP_TXFORMAT_5: |
i = (reg - R200_PP_TXFORMAT_0) / 32; |
if (ib_chunk->kdata[idx] & R200_TXFORMAT_NON_POWER2) { |
track->textures[i].use_pitch = 1; |
} else { |
track->textures[i].use_pitch = 0; |
track->textures[i].width = 1 << ((ib_chunk->kdata[idx] >> RADEON_TXFORMAT_WIDTH_SHIFT) & RADEON_TXFORMAT_WIDTH_MASK); |
track->textures[i].height = 1 << ((ib_chunk->kdata[idx] >> RADEON_TXFORMAT_HEIGHT_SHIFT) & RADEON_TXFORMAT_HEIGHT_MASK); |
} |
switch ((ib_chunk->kdata[idx] & RADEON_TXFORMAT_FORMAT_MASK)) { |
case R200_TXFORMAT_I8: |
case R200_TXFORMAT_RGB332: |
case R200_TXFORMAT_Y8: |
track->textures[i].cpp = 1; |
break; |
case R200_TXFORMAT_DXT1: |
case R200_TXFORMAT_AI88: |
case R200_TXFORMAT_ARGB1555: |
case R200_TXFORMAT_RGB565: |
case R200_TXFORMAT_ARGB4444: |
case R200_TXFORMAT_VYUY422: |
case R200_TXFORMAT_YVYU422: |
case R200_TXFORMAT_LDVDU655: |
case R200_TXFORMAT_DVDU88: |
case R200_TXFORMAT_AVYU4444: |
track->textures[i].cpp = 2; |
break; |
case R200_TXFORMAT_ARGB8888: |
case R200_TXFORMAT_RGBA8888: |
case R200_TXFORMAT_ABGR8888: |
case R200_TXFORMAT_BGR111110: |
case R200_TXFORMAT_LDVDU8888: |
case R200_TXFORMAT_DXT23: |
case R200_TXFORMAT_DXT45: |
track->textures[i].cpp = 4; |
break; |
} |
track->textures[i].cube_info[4].width = 1 << ((ib_chunk->kdata[idx] >> 16) & 0xf); |
track->textures[i].cube_info[4].height = 1 << ((ib_chunk->kdata[idx] >> 20) & 0xf); |
break; |
case R200_PP_CUBIC_FACES_0: |
case R200_PP_CUBIC_FACES_1: |
case R200_PP_CUBIC_FACES_2: |
case R200_PP_CUBIC_FACES_3: |
case R200_PP_CUBIC_FACES_4: |
case R200_PP_CUBIC_FACES_5: |
tmp = ib_chunk->kdata[idx]; |
i = (reg - R200_PP_CUBIC_FACES_0) / 32; |
for (face = 0; face < 4; face++) { |
track->textures[i].cube_info[face].width = 1 << ((tmp >> (face * 8)) & 0xf); |
track->textures[i].cube_info[face].height = 1 << ((tmp >> ((face * 8) + 4)) & 0xf); |
} |
break; |
default: |
printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n", |
reg, idx); |
return -EINVAL; |
} |
return 0; |
} |
#endif |
|
int r200_init(struct radeon_device *rdev) |
{ |
rdev->config.r100.reg_safe_bm = r200_reg_safe_bm; |
rdev->config.r100.reg_safe_bm_size = ARRAY_SIZE(r200_reg_safe_bm); |
return 0; |
} |