Subversion Repositories Kolibri OS

Rev

Rev 1221 | Go to most recent revision | Details | Last modification | View Log | RSS feed

Rev Author Line No. Line
1179 serge 1
/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 *          Alex Deucher
 *          Jerome Glisse
 */
28
#include "drmP.h"
29
#include "drm.h"
30
#include "radeon_drm.h"
31
#include "radeon_reg.h"
32
#include "radeon.h"
33
 
34
#include "r200_reg_safe.h"
35
 
36
//#include "r100_track.h"
37
 
38
#if 0
39
static int r200_get_vtx_size_0(uint32_t vtx_fmt_0)
40
{
41
	int vtx_size, i;
42
	vtx_size = 2;
43
 
44
	if (vtx_fmt_0 & R200_VTX_Z0)
45
		vtx_size++;
46
	if (vtx_fmt_0 & R200_VTX_W0)
47
		vtx_size++;
48
	/* blend weight */
49
	if (vtx_fmt_0 & (0x7 << R200_VTX_WEIGHT_COUNT_SHIFT))
50
		vtx_size += (vtx_fmt_0 >> R200_VTX_WEIGHT_COUNT_SHIFT) & 0x7;
51
	if (vtx_fmt_0 & R200_VTX_PV_MATRIX_SEL)
52
		vtx_size++;
53
	if (vtx_fmt_0 & R200_VTX_N0)
54
		vtx_size += 3;
55
	if (vtx_fmt_0 & R200_VTX_POINT_SIZE)
56
		vtx_size++;
57
	if (vtx_fmt_0 & R200_VTX_DISCRETE_FOG)
58
		vtx_size++;
59
	if (vtx_fmt_0 & R200_VTX_SHININESS_0)
60
		vtx_size++;
61
	if (vtx_fmt_0 & R200_VTX_SHININESS_1)
62
		vtx_size++;
63
	for (i = 0; i < 8; i++) {
64
		int color_size = (vtx_fmt_0 >> (11 + 2*i)) & 0x3;
65
		switch (color_size) {
66
		case 0: break;
67
		case 1: vtx_size++; break;
68
		case 2: vtx_size += 3; break;
69
		case 3: vtx_size += 4; break;
70
		}
71
	}
72
	if (vtx_fmt_0 & R200_VTX_XY1)
73
		vtx_size += 2;
74
	if (vtx_fmt_0 & R200_VTX_Z1)
75
		vtx_size++;
76
	if (vtx_fmt_0 & R200_VTX_W1)
77
		vtx_size++;
78
	if (vtx_fmt_0 & R200_VTX_N1)
79
		vtx_size += 3;
80
	return vtx_size;
81
}
82
 
83
/*
 * r200_get_vtx_size_1 - vertex size selected by a VTX_FMT_1 register value.
 * @vtx_fmt_1: raw value written to R200_SE_VTX_FMT_1
 *
 * The low 18 bits are read as six 3-bit fields.  Each field whose value is
 * 0..4 adds that value to the size; field values above 4 are ignored.
 *
 * Returns the sum of the accepted field values.
 */
static int r200_get_vtx_size_1(uint32_t vtx_fmt_1)
{
	int vtx_size = 0;
	int i;

	for (i = 0; i < 6; i++) {
		int tex_size = (vtx_fmt_1 >> (i * 3)) & 0x7;

		/* Encodings 5..7 contribute nothing. */
		if (tex_size <= 4)
			vtx_size += tex_size;
	}

	return vtx_size;
}
95
 
96
int r200_packet0_check(struct radeon_cs_parser *p,
97
		       struct radeon_cs_packet *pkt,
98
		       unsigned idx, unsigned reg)
99
{
100
	struct radeon_cs_chunk *ib_chunk;
101
	struct radeon_cs_reloc *reloc;
102
	struct r100_cs_track *track;
103
	volatile uint32_t *ib;
104
	uint32_t tmp;
105
	int r;
106
	int i;
107
	int face;
108
	u32 tile_flags = 0;
109
 
110
	ib = p->ib->ptr;
111
	ib_chunk = &p->chunks[p->chunk_ib_idx];
112
	track = (struct r100_cs_track *)p->track;
113
 
114
	switch (reg) {
115
	case RADEON_CRTC_GUI_TRIG_VLINE:
116
		r = r100_cs_packet_parse_vline(p);
117
		if (r) {
118
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
119
				  idx, reg);
120
			r100_cs_dump_packet(p, pkt);
121
			return r;
122
		}
123
		break;
124
		/* FIXME: only allow PACKET3 blit? easier to check for out of
125
		 * range access */
126
	case RADEON_DST_PITCH_OFFSET:
127
	case RADEON_SRC_PITCH_OFFSET:
128
		r = r100_reloc_pitch_offset(p, pkt, idx, reg);
129
		if (r)
130
			return r;
131
		break;
132
	case RADEON_RB3D_DEPTHOFFSET:
133
		r = r100_cs_packet_next_reloc(p, &reloc);
134
		if (r) {
135
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
136
				  idx, reg);
137
			r100_cs_dump_packet(p, pkt);
138
			return r;
139
		}
140
		track->zb.robj = reloc->robj;
141
		track->zb.offset = ib_chunk->kdata[idx];
142
		ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
143
		break;
144
	case RADEON_RB3D_COLOROFFSET:
145
		r = r100_cs_packet_next_reloc(p, &reloc);
146
		if (r) {
147
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
148
				  idx, reg);
149
			r100_cs_dump_packet(p, pkt);
150
			return r;
151
		}
152
		track->cb[0].robj = reloc->robj;
153
		track->cb[0].offset = ib_chunk->kdata[idx];
154
		ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
155
		break;
156
	case R200_PP_TXOFFSET_0:
157
	case R200_PP_TXOFFSET_1:
158
	case R200_PP_TXOFFSET_2:
159
	case R200_PP_TXOFFSET_3:
160
	case R200_PP_TXOFFSET_4:
161
	case R200_PP_TXOFFSET_5:
162
		i = (reg - R200_PP_TXOFFSET_0) / 24;
163
		r = r100_cs_packet_next_reloc(p, &reloc);
164
		if (r) {
165
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
166
				  idx, reg);
167
			r100_cs_dump_packet(p, pkt);
168
			return r;
169
		}
170
		ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
171
		track->textures[i].robj = reloc->robj;
172
		break;
173
	case R200_PP_CUBIC_OFFSET_F1_0:
174
	case R200_PP_CUBIC_OFFSET_F2_0:
175
	case R200_PP_CUBIC_OFFSET_F3_0:
176
	case R200_PP_CUBIC_OFFSET_F4_0:
177
	case R200_PP_CUBIC_OFFSET_F5_0:
178
	case R200_PP_CUBIC_OFFSET_F1_1:
179
	case R200_PP_CUBIC_OFFSET_F2_1:
180
	case R200_PP_CUBIC_OFFSET_F3_1:
181
	case R200_PP_CUBIC_OFFSET_F4_1:
182
	case R200_PP_CUBIC_OFFSET_F5_1:
183
	case R200_PP_CUBIC_OFFSET_F1_2:
184
	case R200_PP_CUBIC_OFFSET_F2_2:
185
	case R200_PP_CUBIC_OFFSET_F3_2:
186
	case R200_PP_CUBIC_OFFSET_F4_2:
187
	case R200_PP_CUBIC_OFFSET_F5_2:
188
	case R200_PP_CUBIC_OFFSET_F1_3:
189
	case R200_PP_CUBIC_OFFSET_F2_3:
190
	case R200_PP_CUBIC_OFFSET_F3_3:
191
	case R200_PP_CUBIC_OFFSET_F4_3:
192
	case R200_PP_CUBIC_OFFSET_F5_3:
193
	case R200_PP_CUBIC_OFFSET_F1_4:
194
	case R200_PP_CUBIC_OFFSET_F2_4:
195
	case R200_PP_CUBIC_OFFSET_F3_4:
196
	case R200_PP_CUBIC_OFFSET_F4_4:
197
	case R200_PP_CUBIC_OFFSET_F5_4:
198
	case R200_PP_CUBIC_OFFSET_F1_5:
199
	case R200_PP_CUBIC_OFFSET_F2_5:
200
	case R200_PP_CUBIC_OFFSET_F3_5:
201
	case R200_PP_CUBIC_OFFSET_F4_5:
202
	case R200_PP_CUBIC_OFFSET_F5_5:
203
		i = (reg - R200_PP_TXOFFSET_0) / 24;
204
		face = (reg - ((i * 24) + R200_PP_TXOFFSET_0)) / 4;
205
		r = r100_cs_packet_next_reloc(p, &reloc);
206
		if (r) {
207
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
208
				  idx, reg);
209
			r100_cs_dump_packet(p, pkt);
210
			return r;
211
		}
212
		track->textures[i].cube_info[face - 1].offset = ib_chunk->kdata[idx];
213
		ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
214
		track->textures[i].cube_info[face - 1].robj = reloc->robj;
215
		break;
216
	case RADEON_RE_WIDTH_HEIGHT:
217
		track->maxy = ((ib_chunk->kdata[idx] >> 16) & 0x7FF);
218
		break;
219
	case RADEON_RB3D_COLORPITCH:
220
		r = r100_cs_packet_next_reloc(p, &reloc);
221
		if (r) {
222
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
223
				  idx, reg);
224
			r100_cs_dump_packet(p, pkt);
225
			return r;
226
		}
227
 
228
		if (reloc->lobj.tiling_flags & RADEON_TILING_MACRO)
229
			tile_flags |= RADEON_COLOR_TILE_ENABLE;
230
		if (reloc->lobj.tiling_flags & RADEON_TILING_MICRO)
231
			tile_flags |= RADEON_COLOR_MICROTILE_ENABLE;
232
 
233
		tmp = ib_chunk->kdata[idx] & ~(0x7 << 16);
234
		tmp |= tile_flags;
235
		ib[idx] = tmp;
236
 
237
		track->cb[0].pitch = ib_chunk->kdata[idx] & RADEON_COLORPITCH_MASK;
238
		break;
239
	case RADEON_RB3D_DEPTHPITCH:
240
		track->zb.pitch = ib_chunk->kdata[idx] & RADEON_DEPTHPITCH_MASK;
241
		break;
242
	case RADEON_RB3D_CNTL:
243
		switch ((ib_chunk->kdata[idx] >> RADEON_RB3D_COLOR_FORMAT_SHIFT) & 0x1f) {
244
		case 7:
245
		case 8:
246
		case 9:
247
		case 11:
248
		case 12:
249
			track->cb[0].cpp = 1;
250
			break;
251
		case 3:
252
		case 4:
253
		case 15:
254
			track->cb[0].cpp = 2;
255
			break;
256
		case 6:
257
			track->cb[0].cpp = 4;
258
			break;
259
		default:
260
			DRM_ERROR("Invalid color buffer format (%d) !\n",
261
				  ((ib_chunk->kdata[idx] >> RADEON_RB3D_COLOR_FORMAT_SHIFT) & 0x1f));
262
			return -EINVAL;
263
		}
264
		if (ib_chunk->kdata[idx] & RADEON_DEPTHXY_OFFSET_ENABLE) {
265
			DRM_ERROR("No support for depth xy offset in kms\n");
266
			return -EINVAL;
267
		}
268
 
269
		track->z_enabled = !!(ib_chunk->kdata[idx] & RADEON_Z_ENABLE);
270
		break;
271
	case RADEON_RB3D_ZSTENCILCNTL:
272
		switch (ib_chunk->kdata[idx] & 0xf) {
273
		case 0:
274
			track->zb.cpp = 2;
275
			break;
276
		case 2:
277
		case 3:
278
		case 4:
279
		case 5:
280
		case 9:
281
		case 11:
282
			track->zb.cpp = 4;
283
			break;
284
		default:
285
			break;
286
		}
287
		break;
288
	case RADEON_RB3D_ZPASS_ADDR:
289
		r = r100_cs_packet_next_reloc(p, &reloc);
290
		if (r) {
291
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
292
				  idx, reg);
293
			r100_cs_dump_packet(p, pkt);
294
			return r;
295
		}
296
		ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
297
		break;
298
	case RADEON_PP_CNTL:
299
		{
300
			uint32_t temp = ib_chunk->kdata[idx] >> 4;
301
			for (i = 0; i < track->num_texture; i++)
302
				track->textures[i].enabled = !!(temp & (1 << i));
303
		}
304
		break;
305
	case RADEON_SE_VF_CNTL:
306
		track->vap_vf_cntl = ib_chunk->kdata[idx];
307
		break;
308
	case 0x210c:
309
		/* VAP_VF_MAX_VTX_INDX */
310
		track->max_indx = ib_chunk->kdata[idx] & 0x00FFFFFFUL;
311
		break;
312
	case R200_SE_VTX_FMT_0:
313
		track->vtx_size = r200_get_vtx_size_0(ib_chunk->kdata[idx]);
314
		break;
315
	case R200_SE_VTX_FMT_1:
316
		track->vtx_size += r200_get_vtx_size_1(ib_chunk->kdata[idx]);
317
		break;
318
	case R200_PP_TXSIZE_0:
319
	case R200_PP_TXSIZE_1:
320
	case R200_PP_TXSIZE_2:
321
	case R200_PP_TXSIZE_3:
322
	case R200_PP_TXSIZE_4:
323
	case R200_PP_TXSIZE_5:
324
		i = (reg - R200_PP_TXSIZE_0) / 32;
325
		track->textures[i].width = (ib_chunk->kdata[idx] & RADEON_TEX_USIZE_MASK) + 1;
326
		track->textures[i].height = ((ib_chunk->kdata[idx] & RADEON_TEX_VSIZE_MASK) >> RADEON_TEX_VSIZE_SHIFT) + 1;
327
		break;
328
	case R200_PP_TXPITCH_0:
329
	case R200_PP_TXPITCH_1:
330
	case R200_PP_TXPITCH_2:
331
	case R200_PP_TXPITCH_3:
332
	case R200_PP_TXPITCH_4:
333
	case R200_PP_TXPITCH_5:
334
		i = (reg - R200_PP_TXPITCH_0) / 32;
335
		track->textures[i].pitch = ib_chunk->kdata[idx] + 32;
336
		break;
337
	case R200_PP_TXFILTER_0:
338
	case R200_PP_TXFILTER_1:
339
	case R200_PP_TXFILTER_2:
340
	case R200_PP_TXFILTER_3:
341
	case R200_PP_TXFILTER_4:
342
	case R200_PP_TXFILTER_5:
343
		i = (reg - R200_PP_TXFILTER_0) / 32;
344
		track->textures[i].num_levels = ((ib_chunk->kdata[idx] & R200_MAX_MIP_LEVEL_MASK)
345
						 >> R200_MAX_MIP_LEVEL_SHIFT);
346
		tmp = (ib_chunk->kdata[idx] >> 23) & 0x7;
347
		if (tmp == 2 || tmp == 6)
348
			track->textures[i].roundup_w = false;
349
		tmp = (ib_chunk->kdata[idx] >> 27) & 0x7;
350
		if (tmp == 2 || tmp == 6)
351
			track->textures[i].roundup_h = false;
352
		break;
353
	case R200_PP_TXMULTI_CTL_0:
354
	case R200_PP_TXMULTI_CTL_1:
355
	case R200_PP_TXMULTI_CTL_2:
356
	case R200_PP_TXMULTI_CTL_3:
357
	case R200_PP_TXMULTI_CTL_4:
358
	case R200_PP_TXMULTI_CTL_5:
359
		i = (reg - R200_PP_TXMULTI_CTL_0) / 32;
360
		break;
361
	case R200_PP_TXFORMAT_X_0:
362
	case R200_PP_TXFORMAT_X_1:
363
	case R200_PP_TXFORMAT_X_2:
364
	case R200_PP_TXFORMAT_X_3:
365
	case R200_PP_TXFORMAT_X_4:
366
	case R200_PP_TXFORMAT_X_5:
367
		i = (reg - R200_PP_TXFORMAT_X_0) / 32;
368
		track->textures[i].txdepth = ib_chunk->kdata[idx] & 0x7;
369
		tmp = (ib_chunk->kdata[idx] >> 16) & 0x3;
370
		/* 2D, 3D, CUBE */
371
		switch (tmp) {
372
		case 0:
373
		case 5:
374
		case 6:
375
		case 7:
376
			track->textures[i].tex_coord_type = 0;
377
			break;
378
		case 1:
379
			track->textures[i].tex_coord_type = 1;
380
			break;
381
		case 2:
382
			track->textures[i].tex_coord_type = 2;
383
			break;
384
		}
385
		break;
386
	case R200_PP_TXFORMAT_0:
387
	case R200_PP_TXFORMAT_1:
388
	case R200_PP_TXFORMAT_2:
389
	case R200_PP_TXFORMAT_3:
390
	case R200_PP_TXFORMAT_4:
391
	case R200_PP_TXFORMAT_5:
392
		i = (reg - R200_PP_TXFORMAT_0) / 32;
393
		if (ib_chunk->kdata[idx] & R200_TXFORMAT_NON_POWER2) {
394
			track->textures[i].use_pitch = 1;
395
		} else {
396
			track->textures[i].use_pitch = 0;
397
			track->textures[i].width = 1 << ((ib_chunk->kdata[idx] >> RADEON_TXFORMAT_WIDTH_SHIFT) & RADEON_TXFORMAT_WIDTH_MASK);
398
			track->textures[i].height = 1 << ((ib_chunk->kdata[idx] >> RADEON_TXFORMAT_HEIGHT_SHIFT) & RADEON_TXFORMAT_HEIGHT_MASK);
399
		}
400
		switch ((ib_chunk->kdata[idx] & RADEON_TXFORMAT_FORMAT_MASK)) {
401
		case R200_TXFORMAT_I8:
402
		case R200_TXFORMAT_RGB332:
403
		case R200_TXFORMAT_Y8:
404
			track->textures[i].cpp = 1;
405
			break;
406
		case R200_TXFORMAT_DXT1:
407
		case R200_TXFORMAT_AI88:
408
		case R200_TXFORMAT_ARGB1555:
409
		case R200_TXFORMAT_RGB565:
410
		case R200_TXFORMAT_ARGB4444:
411
		case R200_TXFORMAT_VYUY422:
412
		case R200_TXFORMAT_YVYU422:
413
		case R200_TXFORMAT_LDVDU655:
414
		case R200_TXFORMAT_DVDU88:
415
		case R200_TXFORMAT_AVYU4444:
416
			track->textures[i].cpp = 2;
417
			break;
418
		case R200_TXFORMAT_ARGB8888:
419
		case R200_TXFORMAT_RGBA8888:
420
		case R200_TXFORMAT_ABGR8888:
421
		case R200_TXFORMAT_BGR111110:
422
		case R200_TXFORMAT_LDVDU8888:
423
		case R200_TXFORMAT_DXT23:
424
		case R200_TXFORMAT_DXT45:
425
			track->textures[i].cpp = 4;
426
			break;
427
		}
428
		track->textures[i].cube_info[4].width = 1 << ((ib_chunk->kdata[idx] >> 16) & 0xf);
429
		track->textures[i].cube_info[4].height = 1 << ((ib_chunk->kdata[idx] >> 20) & 0xf);
430
		break;
431
	case R200_PP_CUBIC_FACES_0:
432
	case R200_PP_CUBIC_FACES_1:
433
	case R200_PP_CUBIC_FACES_2:
434
	case R200_PP_CUBIC_FACES_3:
435
	case R200_PP_CUBIC_FACES_4:
436
	case R200_PP_CUBIC_FACES_5:
437
		tmp = ib_chunk->kdata[idx];
438
		i = (reg - R200_PP_CUBIC_FACES_0) / 32;
439
		for (face = 0; face < 4; face++) {
440
			track->textures[i].cube_info[face].width = 1 << ((tmp >> (face * 8)) & 0xf);
441
			track->textures[i].cube_info[face].height = 1 << ((tmp >> ((face * 8) + 4)) & 0xf);
442
		}
443
		break;
444
	default:
445
		printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n",
446
		       reg, idx);
447
		return -EINVAL;
448
	}
449
	return 0;
450
}
451
#endif
452
 
453
int r200_init(struct radeon_device *rdev)
454
{
455
	rdev->config.r100.reg_safe_bm = r200_reg_safe_bm;
456
	rdev->config.r100.reg_safe_bm_size = ARRAY_SIZE(r200_reg_safe_bm);
457
	return 0;
458
}