1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 **********************************************************/
26 #include "util/u_format.h"
27 #include "util/u_memory.h"
28 #include "util/u_inlines.h"
29 #include "util/u_string.h"
30 #include "util/u_math.h"
32 #include "svga_winsys.h"
33 #include "svga_public.h"
34 #include "svga_context.h"
35 #include "svga_format.h"
36 #include "svga_screen.h"
37 #include "svga_tgsi.h"
38 #include "svga_resource_texture.h"
39 #include "svga_resource.h"
40 #include "svga_debug.h"
42 #include "svga3d_shaderdefs.h"
43 #include "VGPU10ShaderTokens.h"
/*
 * Upper bound reported for texture buffer objects: svga_get_param() returns
 * this constant for PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE.  The value is
 * 128 * 1024 * 1024 (134217728); presumably a size in bytes -- TODO confirm
 * the unit against the svga3d headers.
 */
45 /* NOTE: this constant may get moved into a svga3d*.h header file */
46 #define SVGA3D_DX_MAX_RESOURCE_SIZE (128 * 1024 * 1024)
/*
 * Name -> flag table for the SVGA_DEBUG option.  svga_screen_create() passes
 * it to debug_get_flags_option("SVGA_DEBUG", ...) and stores the result in
 * SVGA_DEBUG.  Each entry pairs an option name with a DEBUG_* flag; the third
 * field is NULL for every entry listed here.
 */
51 static const struct debug_named_value svga_debug_flags[] = {
52 { "dma", DEBUG_DMA, NULL },
53 { "tgsi", DEBUG_TGSI, NULL },
54 { "pipe", DEBUG_PIPE, NULL },
55 { "state", DEBUG_STATE, NULL },
56 { "screen", DEBUG_SCREEN, NULL },
57 { "tex", DEBUG_TEX, NULL },
58 { "swtnl", DEBUG_SWTNL, NULL },
59 { "const", DEBUG_CONSTS, NULL },
60 { "viewport", DEBUG_VIEWPORT, NULL },
61 { "views", DEBUG_VIEWS, NULL },
62 { "perf", DEBUG_PERF, NULL },
63 { "flush", DEBUG_FLUSH, NULL },
64 { "sync", DEBUG_SYNC, NULL },
65 { "cache", DEBUG_CACHE, NULL },
66 { "streamout", DEBUG_STREAMOUT, NULL },
67 { "query", DEBUG_QUERY, NULL },
/**
 * Vendor-string query: returns the constant string "VMware, Inc.".
 * svga_screen_create() installs this function as both
 * pipe_screen::get_vendor and pipe_screen::get_device_vendor.
 *
 * \param pscreen  the screen being queried; not used by the return statement
 */
73 svga_get_vendor( struct pipe_screen *pscreen )
75 return "VMware, Inc.";
/**
 * Name-string query, installed as pipe_screen::get_name by
 * svga_screen_create().
 *
 * Formats "SVGA3D; %s %s %s" from the local strings build, mutex and llvm
 * (each initialised to "") into the function-static buffer name[100] with
 * util_snprintf().  Because the buffer is static, every call writes into the
 * same storage.
 *
 * build is assigned one of "build: DEBUG;", "build: OPT;" (the
 * VMX86_STATS branch) or "build: RELEASE;"; mutex is assigned
 * "mutex: " PIPE_ATOMIC ";" next to the DEBUG build string.
 *
 * NOTE(review): the opening preprocessor condition, any assignment to llvm
 * and the return statement are not visible in the text under review --
 * presumably the function returns name; confirm against the complete file.
 *
 * \param pscreen  the screen being queried; not referenced in the visible body
 */
80 svga_get_name( struct pipe_screen *pscreen )
82 const char *build = "", *llvm = "", *mutex = "";
83 static char name[100];
85 /* Only return internal details in the DEBUG version:
87 build = "build: DEBUG;";
88 mutex = "mutex: " PIPE_ATOMIC ";";
89 #elif defined(VMX86_STATS)
90 build = "build: OPT;";
92 build = "build: RELEASE;";
98 util_snprintf(name, sizeof(name), "SVGA3D; %s %s %s", build, mutex, llvm);
/**
 * Query a device capability through the winsys for callers that want a
 * float (svga_screen_create() uses it for point size and line widths).
 *
 * Calls sws->get_cap(sws, cap, &result) and branches on its return value.
 * NOTE(review): the return statements are not visible in the text under
 * review; presumably a float field of result is returned when get_cap()
 * succeeds and defaultVal otherwise -- confirm.
 *
 * \param sws         winsys screen providing get_cap()
 * \param cap         device cap identifier forwarded to get_cap()
 * \param defaultVal  caller-supplied fallback value
 */
103 /** Helper for querying float-valued device cap */
105 get_float_cap(struct svga_winsys_screen *sws, unsigned cap, float defaultVal)
107 SVGA3dDevCapResult result;
108 if (sws->get_cap(sws, cap, &result))
/**
 * Query a device capability through the winsys for callers that want an
 * unsigned integer (shader limits, anisotropy, sample masks, ...).
 *
 * Calls sws->get_cap(sws, cap, &result) and branches on its return value.
 * NOTE(review): the return statements are not visible in the text under
 * review; presumably result.u (the member read elsewhere in this file) is
 * returned when get_cap() succeeds and defaultVal otherwise -- confirm.
 *
 * \param sws         winsys screen providing get_cap()
 * \param cap         device cap identifier forwarded to get_cap()
 * \param defaultVal  caller-supplied fallback value
 */
115 /** Helper for querying uint-valued device cap */
117 get_uint_cap(struct svga_winsys_screen *sws, unsigned cap, unsigned defaultVal)
119 SVGA3dDevCapResult result;
120 if (sws->get_cap(sws, cap, &result))
/**
 * Query a device capability through the winsys for callers that want a
 * boolean (provoking vertex, line AA and line stipple support in
 * svga_screen_create()).
 *
 * Calls sws->get_cap(sws, cap, &result) and branches on its return value.
 * NOTE(review): the return statements are not visible in the text under
 * review; presumably the queried value is returned when get_cap() succeeds
 * and defaultVal otherwise -- confirm, including which field of result is
 * read.
 *
 * \param sws         winsys screen providing get_cap()
 * \param cap         device cap identifier forwarded to get_cap()
 * \param defaultVal  caller-supplied fallback value
 */
127 /** Helper for querying boolean-valued device cap */
129 get_bool_cap(struct svga_winsys_screen *sws, unsigned cap, boolean defaultVal)
131 SVGA3dDevCapResult result;
132 if (sws->get_cap(sws, cap, &result))
/**
 * Float-valued capability query, installed as pipe_screen::get_paramf by
 * svga_screen_create().
 *
 * Answers visible in the body:
 *  - PIPE_CAPF_MAX_LINE_WIDTH and PIPE_CAPF_MAX_LINE_WIDTH_AA return
 *    svgascreen->maxLineWidth and svgascreen->maxLineWidthAA, both filled
 *    in by svga_screen_create().
 *  - PIPE_CAPF_MAX_POINT_WIDTH_AA returns svgascreen->maxPointSize.
 *  - PIPE_CAPF_MAX_TEXTURE_ANISOTROPY returns the uint device cap
 *    SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY (default 4) converted to float.
 *  - A debug_printf("Unexpected PIPE_CAPF_ query ...") follows the cases.
 *
 * NOTE(review): the values returned for PIPE_CAPF_MAX_POINT_WIDTH,
 * PIPE_CAPF_MAX_TEXTURE_LOD_BIAS and the PIPE_CAPF_GUARD_BAND_* group, and
 * the value returned after the debug message, are not visible in the text
 * under review -- confirm before relying on them.
 *
 * \param screen  the pipe_screen, converted with svga_screen()
 * \param param   which PIPE_CAPF_* value is being asked for
 */
140 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
142 struct svga_screen *svgascreen = svga_screen(screen);
143 struct svga_winsys_screen *sws = svgascreen->sws;
146 case PIPE_CAPF_MAX_LINE_WIDTH:
147 return svgascreen->maxLineWidth;
148 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
149 return svgascreen->maxLineWidthAA;
151 case PIPE_CAPF_MAX_POINT_WIDTH:
153 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
154 return svgascreen->maxPointSize;
156 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
157 return (float) get_uint_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, 4);
159 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
162 case PIPE_CAPF_GUARD_BAND_LEFT:
163 case PIPE_CAPF_GUARD_BAND_TOP:
164 case PIPE_CAPF_GUARD_BAND_RIGHT:
165 case PIPE_CAPF_GUARD_BAND_BOTTOM:
169 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param);
/**
 * Integer capability query, installed as pipe_screen::get_param by
 * svga_screen_create().
 *
 * The answers visible in the body fall into a few groups:
 *  - Caps that depend on sws->have_vgpu10, for example texture buffer
 *    objects, the stream output limits, the texel fetch offsets, the
 *    geometry shader output limits, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS and
 *    PIPE_CAP_GLSL_FEATURE_LEVEL (330 with VGPU10, 120 without).
 *  - Caps taken from values cached on the screen:
 *    PIPE_CAP_MAX_RENDER_TARGETS (max_color_buffers) and
 *    PIPE_CAP_TEXTURE_MULTISAMPLE (1 when ms_samples is non-zero).
 *  - Texture level limits computed from device caps as
 *    util_logbase2(extent) + 1, limited to SVGA_MAX_TEXTURE_LEVELS.  For 2D
 *    textures both SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH and _HEIGHT are
 *    consulted, and 12 levels (2048x2048) also appears as an assigned
 *    value; for 3D textures the result is 8 (128x128x128) when
 *    SVGA3D_DEVCAP_MAX_VOLUME_EXTENT cannot be queried.  The cube-map limit
 *    is derived from the 2D answer by calling screen->get_param() again.
 *  - Fixed answers such as PIPE_CAP_ENDIANNESS (PIPE_ENDIAN_LITTLE),
 *    PIPE_CAP_VENDOR_ID (0x15ad) and PIPE_CAP_DEVICE_ID (0x0405, "assume
 *    SVGA II").
 *  - PIPE_CAP_GENERATE_MIPMAP, which reports sws->have_generate_mipmap_cmd.
 *
 * A debug_printf("Unexpected PIPE_CAP_ query ...") follows the cases.
 *
 * NOTE(review): many case groups (for example the one labelled
 * "Unsupported features") have no return statement in the text under
 * review, so their values cannot be confirmed from here; the else branches
 * of the 2D level computation, the second MIN2() operand of the cube-map
 * case and the final return are likewise not visible.  Check the complete
 * file before documenting those values.
 *
 * \param screen  the pipe_screen, converted with svga_screen()
 * \param param   which PIPE_CAP_* value is being asked for
 */
175 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
177 struct svga_screen *svgascreen = svga_screen(screen);
178 struct svga_winsys_screen *sws = svgascreen->sws;
179 SVGA3dDevCapResult result;
182 case PIPE_CAP_NPOT_TEXTURES:
183 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
184 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
186 case PIPE_CAP_TWO_SIDED_STENCIL:
188 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
190 * "In virtually every OpenGL implementation and hardware,
191 * GL_MAX_DUAL_SOURCE_DRAW_BUFFERS is 1"
192 * http://www.opengl.org/wiki/Blending
194 return sws->have_vgpu10 ? 1 : 0;
195 case PIPE_CAP_ANISOTROPIC_FILTER:
197 case PIPE_CAP_POINT_SPRITE:
199 case PIPE_CAP_TGSI_TEXCOORD:
201 case PIPE_CAP_MAX_RENDER_TARGETS:
202 return svgascreen->max_color_buffers;
203 case PIPE_CAP_OCCLUSION_QUERY:
205 case PIPE_CAP_QUERY_TIME_ELAPSED:
207 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
208 return sws->have_vgpu10;
209 case PIPE_CAP_TEXTURE_SHADOW_MAP:
211 case PIPE_CAP_TEXTURE_SWIZZLE:
213 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
215 case PIPE_CAP_USER_VERTEX_BUFFERS:
217 case PIPE_CAP_USER_CONSTANT_BUFFERS:
219 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
222 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
224 unsigned levels = SVGA_MAX_TEXTURE_LEVELS;
225 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
226 levels = MIN2(util_logbase2(result.u) + 1, levels);
228 levels = 12 /* 2048x2048 */;
229 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
230 levels = MIN2(util_logbase2(result.u) + 1, levels);
232 levels = 12 /* 2048x2048 */;
236 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
237 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
238 return 8; /* max 128x128x128 */
239 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
241 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
243 * No mechanism to query the host, and at least limited to 2048x2048 on
246 return MIN2(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
249 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
250 return sws->have_vgpu10 ? SVGA3D_MAX_SURFACE_ARRAYSIZE : 0;
252 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
255 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
257 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
258 return sws->have_vgpu10;
259 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
261 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
262 return !sws->have_vgpu10;
264 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
265 return 1; /* The color outputs of vertex shaders are not clamped */
266 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
267 return 0; /* The driver can't clamp vertex colors */
268 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
269 return 0; /* The driver can't clamp fragment colors */
271 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
272 return 1; /* expected for GL_ARB_framebuffer_object */
274 case PIPE_CAP_GLSL_FEATURE_LEVEL:
275 return sws->have_vgpu10 ? 330 : 120;
277 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
283 case PIPE_CAP_DEPTH_CLIP_DISABLE:
284 case PIPE_CAP_INDEP_BLEND_ENABLE:
285 case PIPE_CAP_CONDITIONAL_RENDER:
286 case PIPE_CAP_QUERY_TIMESTAMP:
287 case PIPE_CAP_TGSI_INSTANCEID:
288 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
289 case PIPE_CAP_SEAMLESS_CUBE_MAP:
290 case PIPE_CAP_FAKE_SW_MSAA:
291 return sws->have_vgpu10;
293 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
294 return sws->have_vgpu10 ? SVGA3D_DX_MAX_SOTARGETS : 0;
295 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
296 return sws->have_vgpu10 ? 4 : 0;
297 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
298 return sws->have_vgpu10 ? SVGA3D_MAX_STREAMOUT_DECLS : 0;
299 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
300 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
302 case PIPE_CAP_TEXTURE_MULTISAMPLE:
303 return svgascreen->ms_samples ? 1 : 0;
305 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
306 return SVGA3D_DX_MAX_RESOURCE_SIZE;
308 case PIPE_CAP_MIN_TEXEL_OFFSET:
309 return sws->have_vgpu10 ? VGPU10_MIN_TEXEL_FETCH_OFFSET : 0;
310 case PIPE_CAP_MAX_TEXEL_OFFSET:
311 return sws->have_vgpu10 ? VGPU10_MAX_TEXEL_FETCH_OFFSET : 0;
313 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
314 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
317 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
318 return sws->have_vgpu10 ? 256 : 0;
319 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
320 return sws->have_vgpu10 ? 1024 : 0;
322 case PIPE_CAP_PRIMITIVE_RESTART:
323 return 1; /* may be a sw fallback, depending on restart index */
325 case PIPE_CAP_GENERATE_MIPMAP:
326 return sws->have_generate_mipmap_cmd;
328 /* Unsupported features */
329 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
330 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
331 case PIPE_CAP_SHADER_STENCIL_EXPORT:
332 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
333 case PIPE_CAP_INDEP_BLEND_FUNC:
334 case PIPE_CAP_TEXTURE_BARRIER:
335 case PIPE_CAP_MAX_VERTEX_STREAMS:
336 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
337 case PIPE_CAP_COMPUTE:
338 case PIPE_CAP_START_INSTANCE:
339 case PIPE_CAP_CUBE_MAP_ARRAY:
340 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
341 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
342 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
343 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
344 case PIPE_CAP_TEXTURE_GATHER_SM5:
345 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
346 case PIPE_CAP_TEXTURE_QUERY_LOD:
347 case PIPE_CAP_SAMPLE_SHADING:
348 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
349 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
350 case PIPE_CAP_DRAW_INDIRECT:
351 case PIPE_CAP_MULTI_DRAW_INDIRECT:
352 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
353 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
354 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
355 case PIPE_CAP_SAMPLER_VIEW_TARGET:
356 case PIPE_CAP_CLIP_HALFZ:
357 case PIPE_CAP_VERTEXID_NOBASE:
358 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
359 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
360 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
361 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
362 case PIPE_CAP_INVALIDATE_BUFFER:
363 case PIPE_CAP_STRING_MARKER:
364 case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:
365 case PIPE_CAP_QUERY_MEMORY_INFO:
366 case PIPE_CAP_PCI_GROUP:
367 case PIPE_CAP_PCI_BUS:
368 case PIPE_CAP_PCI_DEVICE:
369 case PIPE_CAP_PCI_FUNCTION:
370 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
371 case PIPE_CAP_NATIVE_FENCE_FD:
373 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
375 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
376 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
377 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
378 return 1; /* need 4-byte alignment for all offsets and strides */
379 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
381 case PIPE_CAP_MAX_VIEWPORTS:
383 case PIPE_CAP_ENDIANNESS:
384 return PIPE_ENDIAN_LITTLE;
386 case PIPE_CAP_VENDOR_ID:
387 return 0x15ad; /* VMware Inc. */
388 case PIPE_CAP_DEVICE_ID:
389 return 0x0405; /* assume SVGA II */
390 case PIPE_CAP_ACCELERATED:
392 case PIPE_CAP_VIDEO_MEMORY:
393 /* XXX: Query the host ? */
395 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
396 return sws->have_vgpu10;
397 case PIPE_CAP_CLEAR_TEXTURE:
398 return sws->have_vgpu10;
400 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
401 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
402 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
403 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
404 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
405 case PIPE_CAP_DEPTH_BOUNDS_TEST:
406 case PIPE_CAP_TGSI_TXQS:
407 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
408 case PIPE_CAP_SHAREABLE_SHADERS:
409 case PIPE_CAP_DRAW_PARAMETERS:
410 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
411 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
412 case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:
413 case PIPE_CAP_QUERY_BUFFER_OBJECT:
414 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
415 case PIPE_CAP_CULL_DISTANCE:
416 case PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES:
417 case PIPE_CAP_TGSI_VOTE:
418 case PIPE_CAP_MAX_WINDOW_RECTANGLES:
419 case PIPE_CAP_POLYGON_OFFSET_UNITS_UNSCALED:
420 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
421 case PIPE_CAP_TGSI_ARRAY_COMPONENTS:
422 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
423 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
424 case PIPE_CAP_TGSI_FS_FBFETCH:
425 case PIPE_CAP_TGSI_MUL_ZERO_WINS:
426 case PIPE_CAP_DOUBLES:
428 case PIPE_CAP_INT64_DIVMOD:
429 case PIPE_CAP_TGSI_TEX_TXF_LZ:
430 case PIPE_CAP_TGSI_CLOCK:
431 case PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE:
432 case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:
433 case PIPE_CAP_TGSI_BALLOT:
434 case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:
438 debug_printf("Unexpected PIPE_CAP_ query %u\n", param);
/**
 * Shader capability query for devices without VGPU10; the body asserts that
 * sws->have_vgpu10 is not set.  svga_get_shader_param() calls this function
 * on its non-VGPU10 path.
 *
 * Fragment and vertex shaders are handled in separate sections.  Answers
 * visible in the body:
 *  - Instruction limits come from
 *    SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS and
 *    SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS via get_uint_cap().
 *  - PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH is SVGA3D_MAX_NESTING_LEVEL.
 *  - PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE is 224 * sizeof(float[4]) for
 *    fragment shaders and 256 * sizeof(float[4]) for vertex shaders.
 *  - PIPE_SHADER_CAP_MAX_TEMPS is the matching device cap (default 32)
 *    limited to SVGA3D_TEMPREG_MAX.
 *  - Fragment PIPE_SHADER_CAP_MAX_OUTPUTS is svgascreen->max_color_buffers.
 *  - PIPE_SHADER_CAP_PREFERRED_IR is PIPE_SHADER_IR_TGSI.
 * Geometry, compute and tessellation shader types are grouped under the
 * existing "no support ... at this time" comment.  debug_printf() messages
 * exist for unhandled fragment caps, unhandled vertex caps and unexpected
 * shader types.
 *
 * NOTE(review): the declaration of val, the default arguments of the
 * instruction-limit queries and the return values of most remaining case
 * groups are not visible in the text under review -- confirm against the
 * complete file.
 *
 * \param screen  the pipe_screen, converted with svga_screen()
 * \param shader  shader stage being asked about
 * \param param   which PIPE_SHADER_CAP_* value is being asked for
 */
444 vgpu9_get_shader_param(struct pipe_screen *screen,
445 enum pipe_shader_type shader,
446 enum pipe_shader_cap param)
448 struct svga_screen *svgascreen = svga_screen(screen);
449 struct svga_winsys_screen *sws = svgascreen->sws;
452 assert(!sws->have_vgpu10);
456 case PIPE_SHADER_FRAGMENT:
459 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
460 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
461 return get_uint_cap(sws,
462 SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS,
464 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
465 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
467 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
468 return SVGA3D_MAX_NESTING_LEVEL;
469 case PIPE_SHADER_CAP_MAX_INPUTS:
471 case PIPE_SHADER_CAP_MAX_OUTPUTS:
472 return svgascreen->max_color_buffers;
473 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
474 return 224 * sizeof(float[4]);
475 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
477 case PIPE_SHADER_CAP_MAX_TEMPS:
478 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, 32);
479 return MIN2(val, SVGA3D_TEMPREG_MAX);
480 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
482 * Although PS 3.0 has some addressing abilities it can only represent
483 * loops that can be statically determined and unrolled. Given we can
484 * only handle a subset of the cases that the state tracker already
485 * does it is better to defer loop unrolling to the state tracker.
488 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
490 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
492 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
493 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
494 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
496 case PIPE_SHADER_CAP_SUBROUTINES:
498 case PIPE_SHADER_CAP_INTEGERS:
500 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
501 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
503 case PIPE_SHADER_CAP_PREFERRED_IR:
504 return PIPE_SHADER_IR_TGSI;
505 case PIPE_SHADER_CAP_SUPPORTED_IRS:
507 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
508 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
509 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
510 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
511 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
512 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
513 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
515 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
518 /* If we get here, we failed to handle a cap above */
519 debug_printf("Unexpected fragment shader query %u\n", param);
521 case PIPE_SHADER_VERTEX:
524 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
525 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
526 return get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS,
528 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
529 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
530 /* XXX: until we have vertex texture support */
532 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
533 return SVGA3D_MAX_NESTING_LEVEL;
534 case PIPE_SHADER_CAP_MAX_INPUTS:
536 case PIPE_SHADER_CAP_MAX_OUTPUTS:
538 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
539 return 256 * sizeof(float[4]);
540 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
542 case PIPE_SHADER_CAP_MAX_TEMPS:
543 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, 32);
544 return MIN2(val, SVGA3D_TEMPREG_MAX);
545 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
547 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
549 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
550 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
552 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
554 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
556 case PIPE_SHADER_CAP_SUBROUTINES:
558 case PIPE_SHADER_CAP_INTEGERS:
560 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
561 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
563 case PIPE_SHADER_CAP_PREFERRED_IR:
564 return PIPE_SHADER_IR_TGSI;
565 case PIPE_SHADER_CAP_SUPPORTED_IRS:
567 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
568 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
569 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
570 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
571 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
572 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
573 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
575 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
578 /* If we get here, we failed to handle a cap above */
579 debug_printf("Unexpected vertex shader query %u\n", param);
581 case PIPE_SHADER_GEOMETRY:
582 case PIPE_SHADER_COMPUTE:
583 case PIPE_SHADER_TESS_CTRL:
584 case PIPE_SHADER_TESS_EVAL:
585 /* no support for geometry, tess or compute shaders at this time */
588 debug_printf("Unexpected shader type (%u) query\n", shader);
/**
 * Shader capability query for VGPU10 devices; the body asserts
 * sws->have_vgpu10.  svga_get_shader_param() calls this function when that
 * flag is set.
 *
 * Only vertex, geometry and fragment shaders pass the initial shader-type
 * check.  No device caps are queried here; the visible answers are:
 *  - PIPE_SHADER_CAP_MAX_INPUTS / MAX_OUTPUTS: the VGPU10_MAX_FS_*,
 *    VGPU10_MAX_GS_* or VGPU10_MAX_VS_* constant chosen by shader type.
 *  - PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
 *    VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT * sizeof(float[4]).
 *  - PIPE_SHADER_CAP_MAX_CONST_BUFFERS: svgascreen->max_const_buffers, which
 *    svga_screen_create() fills in.
 *  - PIPE_SHADER_CAP_MAX_TEMPS: VGPU10_MAX_TEMPS.
 *  - The four PIPE_SHADER_CAP_INDIRECT_*_ADDR caps: TRUE (marked
 *    "XXX verify" by the original author).
 *  - PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS / MAX_SAMPLER_VIEWS:
 *    SVGA3D_DX_MAX_SAMPLERS.
 *  - PIPE_SHADER_CAP_PREFERRED_IR: PIPE_SHADER_IR_TGSI.
 * A debug_printf("Unexpected vgpu10 shader query ...") follows the cases.
 *
 * NOTE(review): the value returned when the shader-type check fails and the
 * return values of the remaining case groups are not visible in the text
 * under review -- confirm against the complete file.
 *
 * \param screen  the pipe_screen, converted with svga_screen()
 * \param shader  shader stage being asked about
 * \param param   which PIPE_SHADER_CAP_* value is being asked for
 */
596 vgpu10_get_shader_param(struct pipe_screen *screen,
597 enum pipe_shader_type shader,
598 enum pipe_shader_cap param)
600 struct svga_screen *svgascreen = svga_screen(screen);
601 struct svga_winsys_screen *sws = svgascreen->sws;
603 assert(sws->have_vgpu10);
604 (void) sws; /* silence unused var warnings in non-debug builds */
606 /* Only VS, GS, FS supported */
607 if (shader != PIPE_SHADER_VERTEX &&
608 shader != PIPE_SHADER_GEOMETRY &&
609 shader != PIPE_SHADER_FRAGMENT) {
613 /* NOTE: we do not query the device for any caps/limits at this time */
615 /* Generally the same limits for vertex, geometry and fragment shaders */
617 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
618 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
619 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
620 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
622 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
624 case PIPE_SHADER_CAP_MAX_INPUTS:
625 if (shader == PIPE_SHADER_FRAGMENT)
626 return VGPU10_MAX_FS_INPUTS;
627 else if (shader == PIPE_SHADER_GEOMETRY)
628 return VGPU10_MAX_GS_INPUTS;
630 return VGPU10_MAX_VS_INPUTS;
631 case PIPE_SHADER_CAP_MAX_OUTPUTS:
632 if (shader == PIPE_SHADER_FRAGMENT)
633 return VGPU10_MAX_FS_OUTPUTS;
634 else if (shader == PIPE_SHADER_GEOMETRY)
635 return VGPU10_MAX_GS_OUTPUTS;
637 return VGPU10_MAX_VS_OUTPUTS;
638 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
639 return VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT * sizeof(float[4]);
640 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
641 return svgascreen->max_const_buffers;
642 case PIPE_SHADER_CAP_MAX_TEMPS:
643 return VGPU10_MAX_TEMPS;
644 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
645 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
646 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
647 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
648 return TRUE; /* XXX verify */
649 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
650 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
651 case PIPE_SHADER_CAP_SUBROUTINES:
652 case PIPE_SHADER_CAP_INTEGERS:
654 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
655 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
656 return SVGA3D_DX_MAX_SAMPLERS;
657 case PIPE_SHADER_CAP_PREFERRED_IR:
658 return PIPE_SHADER_IR_TGSI;
659 case PIPE_SHADER_CAP_SUPPORTED_IRS:
661 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
662 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
663 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
664 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
665 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
666 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
667 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
669 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
672 debug_printf("Unexpected vgpu10 shader query %u\n", param);
/**
 * Shader capability query, installed as pipe_screen::get_shader_param by
 * svga_screen_create().
 *
 * Pure dispatcher: when sws->have_vgpu10 is set the query is answered by
 * vgpu10_get_shader_param(), otherwise by vgpu9_get_shader_param().  All
 * three arguments are forwarded unchanged.
 *
 * \param screen  the pipe_screen, converted with svga_screen()
 * \param shader  shader stage being asked about
 * \param param   which PIPE_SHADER_CAP_* value is being asked for
 */
680 svga_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,
681 enum pipe_shader_cap param)
683 struct svga_screen *svgascreen = svga_screen(screen);
684 struct svga_winsys_screen *sws = svgascreen->sws;
685 if (sws->have_vgpu10) {
686 return vgpu10_get_shader_param(screen, shader, param);
689 return vgpu9_get_shader_param(screen, shader, param);
/**
 * Format-support query, installed as pipe_screen::is_format_supported by
 * svga_screen_create().
 *
 * Checks visible in the body, in order:
 *  1. A sample_count above 1 is tested against the ss->ms_samples bitmask
 *     (bit N set means N+1 samples per pixel are supported).
 *  2. The format is translated with svga_translate_format() and compared
 *     with SVGA3D_FORMAT_INVALID.
 *  3. sRGB formats combined with PIPE_BIND_DISPLAY_TARGET are singled out.
 *  4. With VGPU10 and PIPE_BIND_VERTEX_BUFFER the answer is whether
 *     svga_translate_vertex_format_vgpu10() produces a valid format; the
 *     host caps are not queried on this path.
 *  5. For PIPE_BIND_DISPLAY_TARGET a switch on the translated format
 *     overrides the host caps for a fixed list of formats.
 *  6. Otherwise svga_get_format_cap() supplies the host caps.  For
 *     PIPE_BIND_RENDER_TARGET, non-integer formats flagged
 *     SVGA3DFORMAT_OP_NOALPHABLEND are singled out.  Then a mask of required
 *     SVGA3DFORMAT_OP_* bits is built from bindings and target, and the
 *     result is (caps.value & mask.value) == mask.value.
 *
 * NOTE(review): the statements executed when checks 1-3 and the blend check
 * trigger, the values returned inside the display-target switch, the
 * declaration of the bindings parameter and of flags, and the
 * initialisation of mask.value are not visible in the text under review;
 * presumably the failing checks reject the format -- confirm.
 * NOTE(review): svga_format is declared a second time inside the VGPU10
 * vertex-buffer branch, separately from the declaration at the top of the
 * function.
 * NOTE(review): the multisample test shifts 1 by (sample_count - 1) with no
 * visible upper bound on sample_count -- confirm callers keep it in range.
 *
 * \param screen        the pipe_screen, converted with svga_screen()
 * \param format        pipe format being asked about
 * \param target        texture target; cube and 3D targets add cap bits
 * \param sample_count  requested samples per pixel
 */
695 * Implement pipe_screen::is_format_supported().
696 * \param bindings bitmask of PIPE_BIND_x flags
699 svga_is_format_supported( struct pipe_screen *screen,
700 enum pipe_format format,
701 enum pipe_texture_target target,
702 unsigned sample_count,
705 struct svga_screen *ss = svga_screen(screen);
706 SVGA3dSurfaceFormat svga_format;
707 SVGA3dSurfaceFormatCaps caps;
708 SVGA3dSurfaceFormatCaps mask;
712 if (sample_count > 1) {
713 /* In ms_samples, if bit N is set it means that we support
714 * multisample with N+1 samples per pixel.
716 if ((ss->ms_samples & (1 << (sample_count - 1))) == 0) {
721 svga_format = svga_translate_format(ss, format, bindings);
722 if (svga_format == SVGA3D_FORMAT_INVALID) {
726 /* we don't support sRGB rendering into display targets */
727 if (util_format_is_srgb(format) && (bindings & PIPE_BIND_DISPLAY_TARGET)) {
732 * For VGPU10 vertex formats, skip querying host capabilities
735 if (ss->sws->have_vgpu10 && (bindings & PIPE_BIND_VERTEX_BUFFER)) {
736 SVGA3dSurfaceFormat svga_format;
738 svga_translate_vertex_format_vgpu10(format, &svga_format, &flags);
739 return svga_format != SVGA3D_FORMAT_INVALID;
743 * Override host capabilities, so that we end up with the same
744 * visuals for all virtual hardware implementations.
747 if (bindings & PIPE_BIND_DISPLAY_TARGET) {
748 switch (svga_format) {
749 case SVGA3D_A8R8G8B8:
750 case SVGA3D_X8R8G8B8:
755 case SVGA3D_B8G8R8A8_UNORM:
756 case SVGA3D_B8G8R8X8_UNORM:
757 case SVGA3D_B5G6R5_UNORM:
760 /* Often unsupported/problematic. This means we end up with the same
761 * visuals for all virtual hardware implementations.
763 case SVGA3D_A4R4G4B4:
764 case SVGA3D_A1R5G5B5:
773 * Query the host capabilities.
776 svga_get_format_cap(ss, svga_format, &caps);
778 if (bindings & PIPE_BIND_RENDER_TARGET) {
779 /* Check that the color surface is blendable, unless it's an
782 if (!svga_format_is_integer(svga_format) &&
783 (caps.value & SVGA3DFORMAT_OP_NOALPHABLEND)) {
789 if (bindings & PIPE_BIND_RENDER_TARGET) {
790 mask.value |= SVGA3DFORMAT_OP_OFFSCREEN_RENDERTARGET;
792 if (bindings & PIPE_BIND_DEPTH_STENCIL) {
793 mask.value |= SVGA3DFORMAT_OP_ZSTENCIL;
795 if (bindings & PIPE_BIND_SAMPLER_VIEW) {
796 mask.value |= SVGA3DFORMAT_OP_TEXTURE;
799 if (target == PIPE_TEXTURE_CUBE) {
800 mask.value |= SVGA3DFORMAT_OP_CUBETEXTURE;
802 else if (target == PIPE_TEXTURE_3D) {
803 mask.value |= SVGA3DFORMAT_OP_VOLUMETEXTURE;
806 return (caps.value & mask.value) == mask.value;
// Fence reference hook, installed as pipe_screen::fence_reference by
// svga_screen_create().
//
// Forwards ptr and fence unchanged to sws->fence_reference() on the winsys
// screen obtained from svga_screen(screen)->sws; the visible body does
// nothing else.
//
// screen: the pipe_screen that owns the winsys screen
// ptr:    passed through to the winsys as-is
// fence:  passed through to the winsys as-is
811 svga_fence_reference(struct pipe_screen *screen,
812 struct pipe_fence_handle **ptr,
813 struct pipe_fence_handle *fence)
815 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
816 sws->fence_reference(sws, ptr, fence);
// Fence wait hook, installed as pipe_screen::fence_finish by
// svga_screen_create().
//
// The body is bracketed by SVGA_STATS_TIME_PUSH(SVGA_STATS_TIME_FENCEFINISH)
// and SVGA_STATS_TIME_POP.  Two ways of computing retVal are visible:
//  - sws->fence_signalled(sws, fence, 0) == 0
//  - a DEBUG_DMA|DEBUG_PERF log line followed by
//    sws->fence_finish(sws, fence, 0) == 0
// In both, retVal is true exactly when the winsys call returns 0, and the
// third argument handed to the winsys is the literal 0.
//
// NOTE(review): the remaining parameter(s), the declaration of retVal, the
// condition choosing between the two paths and the return statement are not
// visible in the text under review -- presumably a timeout argument selects
// the path and retVal is returned; confirm.  ctx is not referenced in the
// visible body.
821 svga_fence_finish(struct pipe_screen *screen,
822 struct pipe_context *ctx,
823 struct pipe_fence_handle *fence,
826 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
829 SVGA_STATS_TIME_PUSH(sws, SVGA_STATS_TIME_FENCEFINISH);
832 retVal = sws->fence_signalled(sws, fence, 0) == 0;
835 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
836 __FUNCTION__, fence);
838 retVal = sws->fence_finish(sws, fence, 0) == 0;
841 SVGA_STATS_TIME_POP(sws);
// Driver-specific query enumeration, installed as
// pipe_screen::get_driver_query_info by svga_screen_create().
//
// The QUERY() helper macro expands to a pipe_driver_query_info initializer
// that uses PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, and the static queries[]
// table lists the per-frame counters followed by the running-total counters.
// The body returns ARRAY_SIZE(queries) on one path and, on another, compares
// index against ARRAY_SIZE(queries) before copying queries[index] into *info.
//
// NOTE(review): the declaration of the index parameter, the condition that
// selects the count-returning path (presumably a NULL info pointer), and the
// values returned for an out-of-range index and after the copy are not
// visible in the text under review -- confirm against the complete file.
848 svga_get_driver_query_info(struct pipe_screen *screen,
850 struct pipe_driver_query_info *info)
852 #define QUERY(NAME, ENUM, UNITS) \
853 {NAME, ENUM, {0}, UNITS, PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, 0, 0x0}
855 static const struct pipe_driver_query_info queries[] = {
856 /* per-frame counters */
857 QUERY("num-draw-calls", SVGA_QUERY_NUM_DRAW_CALLS,
858 PIPE_DRIVER_QUERY_TYPE_UINT64),
859 QUERY("num-fallbacks", SVGA_QUERY_NUM_FALLBACKS,
860 PIPE_DRIVER_QUERY_TYPE_UINT64),
861 QUERY("num-flushes", SVGA_QUERY_NUM_FLUSHES,
862 PIPE_DRIVER_QUERY_TYPE_UINT64),
863 QUERY("num-validations", SVGA_QUERY_NUM_VALIDATIONS,
864 PIPE_DRIVER_QUERY_TYPE_UINT64),
865 QUERY("map-buffer-time", SVGA_QUERY_MAP_BUFFER_TIME,
866 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
867 QUERY("num-buffers-mapped", SVGA_QUERY_NUM_BUFFERS_MAPPED,
868 PIPE_DRIVER_QUERY_TYPE_UINT64),
869 QUERY("num-textures-mapped", SVGA_QUERY_NUM_TEXTURES_MAPPED,
870 PIPE_DRIVER_QUERY_TYPE_UINT64),
871 QUERY("num-bytes-uploaded", SVGA_QUERY_NUM_BYTES_UPLOADED,
872 PIPE_DRIVER_QUERY_TYPE_BYTES),
873 QUERY("command-buffer-size", SVGA_QUERY_COMMAND_BUFFER_SIZE,
874 PIPE_DRIVER_QUERY_TYPE_BYTES),
875 QUERY("flush-time", SVGA_QUERY_FLUSH_TIME,
876 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
877 QUERY("surface-write-flushes", SVGA_QUERY_SURFACE_WRITE_FLUSHES,
878 PIPE_DRIVER_QUERY_TYPE_UINT64),
879 QUERY("num-readbacks", SVGA_QUERY_NUM_READBACKS,
880 PIPE_DRIVER_QUERY_TYPE_UINT64),
881 QUERY("num-resource-updates", SVGA_QUERY_NUM_RESOURCE_UPDATES,
882 PIPE_DRIVER_QUERY_TYPE_UINT64),
883 QUERY("num-buffer-uploads", SVGA_QUERY_NUM_BUFFER_UPLOADS,
884 PIPE_DRIVER_QUERY_TYPE_UINT64),
885 QUERY("num-const-buf-updates", SVGA_QUERY_NUM_CONST_BUF_UPDATES,
886 PIPE_DRIVER_QUERY_TYPE_UINT64),
887 QUERY("num-const-updates", SVGA_QUERY_NUM_CONST_UPDATES,
888 PIPE_DRIVER_QUERY_TYPE_UINT64),
890 /* running total counters */
891 QUERY("memory-used", SVGA_QUERY_MEMORY_USED,
892 PIPE_DRIVER_QUERY_TYPE_BYTES),
893 QUERY("num-shaders", SVGA_QUERY_NUM_SHADERS,
894 PIPE_DRIVER_QUERY_TYPE_UINT64),
895 QUERY("num-resources", SVGA_QUERY_NUM_RESOURCES,
896 PIPE_DRIVER_QUERY_TYPE_UINT64),
897 QUERY("num-state-objects", SVGA_QUERY_NUM_STATE_OBJECTS,
898 PIPE_DRIVER_QUERY_TYPE_UINT64),
899 QUERY("num-surface-views", SVGA_QUERY_NUM_SURFACE_VIEWS,
900 PIPE_DRIVER_QUERY_TYPE_UINT64),
901 QUERY("num-generate-mipmap", SVGA_QUERY_NUM_GENERATE_MIPMAP,
902 PIPE_DRIVER_QUERY_TYPE_UINT64),
907 return ARRAY_SIZE(queries);
909 if (index >= ARRAY_SIZE(queries))
912 *info = queries[index];
/**
 * Screen teardown, installed as pipe_screen::destroy by
 * svga_screen_create().
 *
 * Visible steps, in order: svga_screen_cache_cleanup(), mtx_destroy() on
 * swc_mutex and tex_mutex (both initialised in svga_screen_create()), then
 * the winsys screen's own destroy() hook.
 *
 * NOTE(review): the release of the svga_screen structure itself is not
 * visible in the text under review -- confirm against the complete file.
 *
 * \param screen  the pipe_screen to destroy, converted with svga_screen()
 */
918 svga_destroy_screen( struct pipe_screen *screen )
920 struct svga_screen *svgascreen = svga_screen(screen);
922 svga_screen_cache_cleanup(svgascreen);
924 mtx_destroy(&svgascreen->swc_mutex);
925 mtx_destroy(&svgascreen->tex_mutex);
927 svgascreen->sws->destroy(svgascreen->sws);
/**
 * Build and initialise an svga_screen on top of the given winsys screen.
 *
 * Steps visible in the body, in order:
 *  - SVGA_DEBUG is set from the SVGA_DEBUG option using svga_debug_flags.
 *  - The svga_screen is allocated with CALLOC_STRUCT().
 *  - The svgascreen->debug.* switches are read from the SVGA_FORCE_* and
 *    SVGA_NO_* boolean options, all defaulting to FALSE.
 *  - The pipe_screen callbacks are installed (get_timestamp is set to NULL)
 *    and sws is stored in svgascreen->sws.
 *  - svga_init_screen_resource_functions() is called.
 *  - hw_version comes from sws->get_hw_version() when the winsys provides
 *    that hook; SVGA3D_HWVERSION_WS65_B1 is the other value assigned.
 *  - Depth formats start as D16 / D24X8 / D24S8 and are switched to DF16 /
 *    DF24 / D24S8_INT according to svga_get_format_cap() results.
 *  - Device caps are gathered.  With sws->have_vgpu10: provoking-vertex
 *    support is queried, line smoothing is TRUE, maxPointSize is 80.0,
 *    max_color_buffers is SVGA3D_DX_MAX_RENDER_TARGETS, ms_samples is
 *    queried when the SVGA_MSAA option (default TRUE) allows it, and
 *    max_const_buffers is queried (default 1) and asserted to be at most
 *    SVGA_MAX_CONST_BUFS.  On the other path the vertex and fragment shader
 *    versions are compared against the 3.0 versions, provoking vertex is
 *    FALSE, line smoothing and point size are queried (point size limited
 *    to 80.0), max_color_buffers is 4, max_const_buffers is 1 and
 *    ms_samples is 0.
 *  - Line stipple and the two line-width limits are queried for both
 *    device types.
 *  - The collected values are printed with debug_printf().
 *  - tex_mutex and swc_mutex are initialised (return values discarded) and
 *    svga_screen_cache_init() is called.
 *
 * NOTE(review): the allocation-failure handling, the value assigned to mask
 * for the depth probes, the conditions guarding the DF16 / DF24 switches,
 * the action taken when shader model 3.0 is missing, any guard around the
 * debug_printf() calls and the return statement are not visible in the text
 * under review -- confirm against the complete file.
 *
 * \param sws  winsys screen to wrap; stored in svgascreen->sws
 */
934 * Create a new svga_screen object
937 svga_screen_create(struct svga_winsys_screen *sws)
939 struct svga_screen *svgascreen;
940 struct pipe_screen *screen;
943 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
946 svgascreen = CALLOC_STRUCT(svga_screen);
950 svgascreen->debug.force_level_surface_view =
951 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
952 svgascreen->debug.force_surface_view =
953 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
954 svgascreen->debug.force_sampler_view =
955 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
956 svgascreen->debug.no_surface_view =
957 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
958 svgascreen->debug.no_sampler_view =
959 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
960 svgascreen->debug.no_cache_index_buffers =
961 debug_get_bool_option("SVGA_NO_CACHE_INDEX_BUFFERS", FALSE);
963 screen = &svgascreen->screen;
965 screen->destroy = svga_destroy_screen;
966 screen->get_name = svga_get_name;
967 screen->get_vendor = svga_get_vendor;
968 screen->get_device_vendor = svga_get_vendor; // TODO actual device vendor
969 screen->get_param = svga_get_param;
970 screen->get_shader_param = svga_get_shader_param;
971 screen->get_paramf = svga_get_paramf;
972 screen->get_timestamp = NULL;
973 screen->is_format_supported = svga_is_format_supported;
974 screen->context_create = svga_context_create;
975 screen->fence_reference = svga_fence_reference;
976 screen->fence_finish = svga_fence_finish;
977 screen->get_driver_query_info = svga_get_driver_query_info;
978 svgascreen->sws = sws;
980 svga_init_screen_resource_functions(svgascreen);
982 if (sws->get_hw_version) {
983 svgascreen->hw_version = sws->get_hw_version(sws);
985 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
989 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
990 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
991 * we prefer the later when available.
993 * This mimics hardware vendors extensions for D3D depth sampling. See also
994 * http://aras-p.info/texts/D3D9GPUHacks.html
998 boolean has_df16, has_df24, has_d24s8_int;
999 SVGA3dSurfaceFormatCaps caps;
1000 SVGA3dSurfaceFormatCaps mask;
1005 svgascreen->depth.z16 = SVGA3D_Z_D16;
1006 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
1007 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
1009 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
1010 has_df16 = (caps.value & mask.value) == mask.value;
1012 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
1013 has_df24 = (caps.value & mask.value) == mask.value;
1015 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
1016 has_d24s8_int = (caps.value & mask.value) == mask.value;
1018 /* XXX: We might want some other logic here.
1019 * Like if we only have d24s8_int we should
1020 * emulate the other formats with that.
1023 svgascreen->depth.z16 = SVGA3D_Z_DF16;
1026 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
1028 if (has_d24s8_int) {
1029 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
1033 /* Query device caps
1035 if (sws->have_vgpu10) {
1036 svgascreen->haveProvokingVertex
1037 = get_bool_cap(sws, SVGA3D_DEVCAP_DX_PROVOKING_VERTEX, FALSE);
1038 svgascreen->haveLineSmooth = TRUE;
1039 svgascreen->maxPointSize = 80.0F;
1040 svgascreen->max_color_buffers = SVGA3D_DX_MAX_RENDER_TARGETS;
1042 /* Multisample samples per pixel */
1043 if (debug_get_bool_option("SVGA_MSAA", TRUE)) {
1044 svgascreen->ms_samples =
1045 get_uint_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_MASKABLESAMPLES, 0);
1048 /* Maximum number of constant buffers */
1049 svgascreen->max_const_buffers =
1050 get_uint_cap(sws, SVGA3D_DEVCAP_DX_MAX_CONSTANT_BUFFERS, 1);
1051 assert(svgascreen->max_const_buffers <= SVGA_MAX_CONST_BUFS);
1055 unsigned vs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION,
1056 SVGA3DVSVERSION_NONE);
1057 unsigned fs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION,
1058 SVGA3DPSVERSION_NONE);
1060 /* we require Shader model 3.0 or later */
1061 if (fs_ver < SVGA3DPSVERSION_30 || vs_ver < SVGA3DVSVERSION_30) {
1065 svgascreen->haveProvokingVertex = FALSE;
1067 svgascreen->haveLineSmooth =
1068 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_AA, FALSE);
1070 svgascreen->maxPointSize =
1071 get_float_cap(sws, SVGA3D_DEVCAP_MAX_POINT_SIZE, 1.0f);
1072 /* Keep this to a reasonable size to avoid failures in conform/pntaa.c */
1073 svgascreen->maxPointSize = MIN2(svgascreen->maxPointSize, 80.0f);
1075 /* The SVGA3D device always supports 4 targets at this time, regardless
1076 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
1078 svgascreen->max_color_buffers = 4;
1080 /* Only support one constant buffer
1082 svgascreen->max_const_buffers = 1;
1084 /* No multisampling */
1085 svgascreen->ms_samples = 0;
1088 /* common VGPU9 / VGPU10 caps */
1089 svgascreen->haveLineStipple =
1090 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_STIPPLE, FALSE);
1092 svgascreen->maxLineWidth =
1093 get_float_cap(sws, SVGA3D_DEVCAP_MAX_LINE_WIDTH, 1.0f);
1095 svgascreen->maxLineWidthAA =
1096 get_float_cap(sws, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH, 1.0f);
1099 debug_printf("svga: haveProvokingVertex %u\n",
1100 svgascreen->haveProvokingVertex);
1101 debug_printf("svga: haveLineStip %u "
1102 "haveLineSmooth %u maxLineWidth %f\n",
1103 svgascreen->haveLineStipple, svgascreen->haveLineSmooth,
1104 svgascreen->maxLineWidth);
1105 debug_printf("svga: maxPointSize %g\n", svgascreen->maxPointSize);
1106 debug_printf("svga: msaa samples mask: 0x%x\n", svgascreen->ms_samples);
1109 (void) mtx_init(&svgascreen->tex_mutex, mtx_plain);
1110 (void) mtx_init(&svgascreen->swc_mutex, mtx_plain);
1112 svga_screen_cache_init(svgascreen);
/**
 * Return the winsys screen behind a pipe_screen: converts screen with
 * svga_screen() and returns its sws member (the pointer stored by
 * svga_screen_create()).
 *
 * \param screen  a pipe_screen created by this driver
 */
1121 struct svga_winsys_screen *
1122 svga_winsys_screen(struct pipe_screen *screen)
1124 return svga_screen(screen)->sws;
/**
 * Convert a pipe_screen pointer to the svga_screen that contains it.
 *
 * The assert checks that the screen's destroy hook is svga_destroy_screen,
 * i.e. that the screen was set up by svga_screen_create(), before the
 * pointer is cast to struct svga_screen *.
 *
 * \param screen  a pipe_screen created by this driver
 */
1128 struct svga_screen *
1129 svga_screen(struct pipe_screen *screen)
1132 assert(screen->destroy == svga_destroy_screen);
1133 return (struct svga_screen *)screen;