| /************************************************************************** |
| * |
| * Copyright 2008 VMware, Inc. |
| * All Rights Reserved. |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a |
| * copy of this software and associated documentation files (the |
| * "Software"), to deal in the Software without restriction, including |
| * without limitation the rights to use, copy, modify, merge, publish, |
| * distribute, sub license, and/or sell copies of the Software, and to |
| * permit persons to whom the Software is furnished to do so, subject to |
| * the following conditions: |
| * |
| * The above copyright notice and this permission notice (including the |
| * next paragraph) shall be included in all copies or substantial portions |
| * of the Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
| * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
| * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. |
| * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR |
| * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, |
| * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE |
| * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
| * |
| **************************************************************************/ |
| |
| |
| #include "util/u_memory.h" |
| #include "util/u_math.h" |
| #include "util/u_cpu_detect.h" |
| #include "util/format/u_format.h" |
| #include "util/u_screen.h" |
| #include "util/u_string.h" |
| #include "util/format/u_format_s3tc.h" |
| #include "pipe/p_defines.h" |
| #include "pipe/p_screen.h" |
| #include "draw/draw_context.h" |
| #include "gallivm/lp_bld_type.h" |
| #include "gallivm/lp_bld_nir.h" |
| #include "util/disk_cache.h" |
| #include "util/os_misc.h" |
| #include "util/os_time.h" |
| #include "lp_texture.h" |
| #include "lp_fence.h" |
| #include "lp_jit.h" |
| #include "lp_screen.h" |
| #include "lp_context.h" |
| #include "lp_debug.h" |
| #include "lp_public.h" |
| #include "lp_limits.h" |
| #include "lp_rast.h" |
| #include "lp_cs_tpool.h" |
| |
| #include "frontend/sw_winsys.h" |
| |
| #include "nir.h" |
| |
| #ifdef DEBUG |
| int LP_DEBUG = 0; |
| |
| static const struct debug_named_value lp_debug_flags[] = { |
| { "pipe", DEBUG_PIPE, NULL }, |
| { "tgsi", DEBUG_TGSI, NULL }, |
| { "tex", DEBUG_TEX, NULL }, |
| { "setup", DEBUG_SETUP, NULL }, |
| { "rast", DEBUG_RAST, NULL }, |
| { "query", DEBUG_QUERY, NULL }, |
| { "screen", DEBUG_SCREEN, NULL }, |
| { "counters", DEBUG_COUNTERS, NULL }, |
| { "scene", DEBUG_SCENE, NULL }, |
| { "fence", DEBUG_FENCE, NULL }, |
| { "mem", DEBUG_MEM, NULL }, |
| { "fs", DEBUG_FS, NULL }, |
| { "cs", DEBUG_CS, NULL }, |
| { "tgsi_ir", DEBUG_TGSI_IR, NULL }, |
| { "cl", DEBUG_CL, NULL }, |
| { "cache_stats", DEBUG_CACHE_STATS, NULL }, |
| DEBUG_NAMED_VALUE_END |
| }; |
| #endif |
| |
| int LP_PERF = 0; |
| static const struct debug_named_value lp_perf_flags[] = { |
| { "texmem", PERF_TEX_MEM, NULL }, |
| { "no_mipmap", PERF_NO_MIPMAPS, NULL }, |
| { "no_linear", PERF_NO_LINEAR, NULL }, |
| { "no_mip_linear", PERF_NO_MIP_LINEAR, NULL }, |
| { "no_tex", PERF_NO_TEX, NULL }, |
| { "no_blend", PERF_NO_BLEND, NULL }, |
| { "no_depth", PERF_NO_DEPTH, NULL }, |
| { "no_alphatest", PERF_NO_ALPHATEST, NULL }, |
| DEBUG_NAMED_VALUE_END |
| }; |
| |
| |
| static const char * |
| llvmpipe_get_vendor(struct pipe_screen *screen) |
| { |
| return "Mesa/X.org"; |
| } |
| |
| |
| static const char * |
| llvmpipe_get_name(struct pipe_screen *screen) |
| { |
| static char buf[100]; |
| snprintf(buf, sizeof(buf), "llvmpipe (LLVM " MESA_LLVM_VERSION_STRING ", %u bits)", |
| lp_native_vector_width ); |
| return buf; |
| } |
| |
| |
| static int |
| llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param) |
| { |
| switch (param) { |
| case PIPE_CAP_NPOT_TEXTURES: |
| case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES: |
| case PIPE_CAP_MIXED_COLOR_DEPTH_BITS: |
| return 1; |
| case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD: |
| case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES: |
| case PIPE_CAP_VERTEX_SHADER_SATURATE: |
| return 1; |
| case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS: |
| return 1; |
| case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS: |
| return PIPE_MAX_SO_BUFFERS; |
| case PIPE_CAP_POINT_SPRITE: |
| return 1; |
| case PIPE_CAP_MAX_RENDER_TARGETS: |
| return PIPE_MAX_COLOR_BUFS; |
| case PIPE_CAP_OCCLUSION_QUERY: |
| case PIPE_CAP_QUERY_TIMESTAMP: |
| return 1; |
| case PIPE_CAP_QUERY_PIPELINE_STATISTICS: |
| return 1; |
| case PIPE_CAP_TEXTURE_MIRROR_CLAMP: |
| case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE: |
| return 1; |
| case PIPE_CAP_TEXTURE_SWIZZLE: |
| case PIPE_CAP_TEXTURE_SHADOW_LOD: |
| return 1; |
| case PIPE_CAP_MAX_TEXTURE_2D_SIZE: |
| return 1 << (LP_MAX_TEXTURE_2D_LEVELS - 1); |
| case PIPE_CAP_MAX_TEXTURE_3D_LEVELS: |
| return LP_MAX_TEXTURE_3D_LEVELS; |
| case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS: |
| return LP_MAX_TEXTURE_CUBE_LEVELS; |
| case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS: |
| return LP_MAX_TEXTURE_ARRAY_LAYERS; |
| case PIPE_CAP_BLEND_EQUATION_SEPARATE: |
| return 1; |
| case PIPE_CAP_INDEP_BLEND_ENABLE: |
| return 1; |
| case PIPE_CAP_INDEP_BLEND_FUNC: |
| return 1; |
| case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT: |
| case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER: |
| case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER: |
| return 1; |
| case PIPE_CAP_PRIMITIVE_RESTART: |
| case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX: |
| return 1; |
| case PIPE_CAP_DEPTH_CLIP_DISABLE: |
| return 1; |
| case PIPE_CAP_SHADER_STENCIL_EXPORT: |
| return 1; |
| case PIPE_CAP_TGSI_INSTANCEID: |
| case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR: |
| case PIPE_CAP_START_INSTANCE: |
| case PIPE_CAP_MIXED_COLORBUFFER_FORMATS: |
| return 1; |
| case PIPE_CAP_SEAMLESS_CUBE_MAP: |
| case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE: |
| return 1; |
| /* this is a lie could support arbitrary large offsets */ |
| case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET: |
| case PIPE_CAP_MIN_TEXEL_OFFSET: |
| return -32; |
| case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET: |
| case PIPE_CAP_MAX_TEXEL_OFFSET: |
| return 31; |
| case PIPE_CAP_CONDITIONAL_RENDER: |
| case PIPE_CAP_TEXTURE_BARRIER: |
| return 1; |
| case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS: |
| case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS: |
| return 16*4; |
| case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES: |
| case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS: |
| return 1024; |
| case PIPE_CAP_MAX_VERTEX_STREAMS: { |
| struct llvmpipe_screen *lscreen = llvmpipe_screen(screen); |
| return lscreen->use_tgsi ? 1 : 4; |
| } |
| case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE: |
| return 2048; |
| case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME: |
| case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS: |
| case PIPE_CAP_VERTEX_COLOR_UNCLAMPED: |
| case PIPE_CAP_VERTEX_COLOR_CLAMPED: |
| return 1; |
| case PIPE_CAP_GLSL_FEATURE_LEVEL: { |
| struct llvmpipe_screen *lscreen = llvmpipe_screen(screen); |
| return lscreen->use_tgsi ? 330 : 450; |
| } |
| case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY: |
| return 140; |
| case PIPE_CAP_COMPUTE: |
| return GALLIVM_HAVE_CORO; |
| case PIPE_CAP_USER_VERTEX_BUFFERS: |
| return 1; |
| case PIPE_CAP_TGSI_TEXCOORD: |
| case PIPE_CAP_DRAW_INDIRECT: |
| return 1; |
| |
| case PIPE_CAP_CUBE_MAP_ARRAY: |
| return 1; |
| case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT: |
| return 16; |
| case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT: |
| return 64; |
| case PIPE_CAP_TEXTURE_BUFFER_OBJECTS: |
| return 1; |
| case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE: |
| return 65536; |
| case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT: |
| return 16; |
| case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER: |
| return 0; |
| case PIPE_CAP_MAX_VIEWPORTS: |
| return PIPE_MAX_VIEWPORTS; |
| case PIPE_CAP_ENDIANNESS: |
| return PIPE_ENDIAN_NATIVE; |
| case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT: |
| return 1; |
| case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT: |
| return 1; |
| case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS: |
| return 4; |
| case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION: |
| return 1; |
| case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE: |
| return 1; |
| case PIPE_CAP_TGSI_TEX_TXF_LZ: |
| case PIPE_CAP_SAMPLER_VIEW_TARGET: |
| return 1; |
| case PIPE_CAP_FAKE_SW_MSAA: { |
| struct llvmpipe_screen *lscreen = llvmpipe_screen(screen); |
| return lscreen->use_tgsi ? 1 : 0; |
| } |
| case PIPE_CAP_TEXTURE_QUERY_LOD: |
| case PIPE_CAP_CONDITIONAL_RENDER_INVERTED: |
| case PIPE_CAP_TGSI_ARRAY_COMPONENTS: |
| case PIPE_CAP_DOUBLES: |
| case PIPE_CAP_INT64: |
| case PIPE_CAP_INT64_DIVMOD: |
| case PIPE_CAP_QUERY_SO_OVERFLOW: |
| case PIPE_CAP_TGSI_DIV: |
| return 1; |
| |
| case PIPE_CAP_VENDOR_ID: |
| return 0xFFFFFFFF; |
| case PIPE_CAP_DEVICE_ID: |
| return 0xFFFFFFFF; |
| case PIPE_CAP_ACCELERATED: |
| return 0; |
| case PIPE_CAP_VIDEO_MEMORY: { |
| /* XXX: Do we want to return the full amount fo system memory ? */ |
| uint64_t system_memory; |
| |
| if (!os_get_total_physical_memory(&system_memory)) |
| return 0; |
| |
| if (sizeof(void *) == 4) |
| /* Cap to 2 GB on 32 bits system. We do this because llvmpipe does |
| * eat application memory, which is quite limited on 32 bits. App |
| * shouldn't expect too much available memory. */ |
| system_memory = MIN2(system_memory, 2048 << 20); |
| |
| return (int)(system_memory >> 20); |
| } |
| case PIPE_CAP_UMA: |
| return 0; |
| case PIPE_CAP_CLIP_HALFZ: |
| return 1; |
| case PIPE_CAP_POLYGON_OFFSET_CLAMP: |
| case PIPE_CAP_TEXTURE_FLOAT_LINEAR: |
| case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR: |
| return 1; |
| case PIPE_CAP_CULL_DISTANCE: |
| return 1; |
| case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS: |
| return 1; |
| case PIPE_CAP_CLEAR_TEXTURE: |
| return 1; |
| case PIPE_CAP_MAX_VARYINGS: |
| return 32; |
| case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT: |
| return 16; |
| case PIPE_CAP_QUERY_BUFFER_OBJECT: |
| return 1; |
| case PIPE_CAP_DRAW_PARAMETERS: |
| return 1; |
| case PIPE_CAP_FBFETCH: |
| return 8; |
| case PIPE_CAP_FBFETCH_COHERENT: |
| return 0; |
| case PIPE_CAP_MULTI_DRAW_INDIRECT: |
| case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS: |
| return 1; |
| case PIPE_CAP_DEVICE_RESET_STATUS_QUERY: |
| case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR: |
| return 1; |
| case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS: |
| return 32; |
| case PIPE_CAP_RASTERIZER_SUBPIXEL_BITS: |
| return 8; |
| case PIPE_CAP_PCI_GROUP: |
| case PIPE_CAP_PCI_BUS: |
| case PIPE_CAP_PCI_DEVICE: |
| case PIPE_CAP_PCI_FUNCTION: |
| case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY: |
| case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION: |
| return 0; |
| case PIPE_CAP_MAX_GS_INVOCATIONS: |
| return 32; |
| case PIPE_CAP_MAX_SHADER_BUFFER_SIZE: |
| return LP_MAX_TGSI_SHADER_BUFFER_SIZE; |
| case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT: |
| case PIPE_CAP_TGSI_TG4_COMPONENT_IN_SWIZZLE: |
| case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL: |
| return 1; |
| case PIPE_CAP_TGSI_TXQS: |
| case PIPE_CAP_TGSI_VOTE: |
| case PIPE_CAP_LOAD_CONSTBUF: |
| case PIPE_CAP_TEXTURE_MULTISAMPLE: |
| case PIPE_CAP_SAMPLE_SHADING: |
| case PIPE_CAP_POST_DEPTH_COVERAGE: |
| case PIPE_CAP_PACKED_UNIFORMS: { |
| struct llvmpipe_screen *lscreen = llvmpipe_screen(screen); |
| return !lscreen->use_tgsi; |
| } |
| default: |
| return u_pipe_screen_get_param_defaults(screen, param); |
| } |
| } |
| |
| static int |
| llvmpipe_get_shader_param(struct pipe_screen *screen, |
| enum pipe_shader_type shader, |
| enum pipe_shader_cap param) |
| { |
| struct llvmpipe_screen *lscreen = llvmpipe_screen(screen); |
| switch(shader) |
| { |
| case PIPE_SHADER_COMPUTE: |
| if ((LP_DEBUG & DEBUG_CL) && param == PIPE_SHADER_CAP_SUPPORTED_IRS) |
| return (1 << PIPE_SHADER_IR_TGSI) | (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_NIR_SERIALIZED); |
| /* fallthrough */ |
| case PIPE_SHADER_FRAGMENT: |
| if (param == PIPE_SHADER_CAP_PREFERRED_IR) { |
| if (lscreen->use_tgsi) |
| return PIPE_SHADER_IR_TGSI; |
| else |
| return PIPE_SHADER_IR_NIR; |
| } |
| switch (param) { |
| default: |
| return gallivm_get_shader_param(param); |
| } |
| /* fallthrough */ |
| case PIPE_SHADER_TESS_CTRL: |
| case PIPE_SHADER_TESS_EVAL: |
| /* Tessellation shader needs llvm coroutines support */ |
| if (!GALLIVM_HAVE_CORO || lscreen->use_tgsi) |
| return 0; |
| /* fallthrough */ |
| case PIPE_SHADER_VERTEX: |
| case PIPE_SHADER_GEOMETRY: |
| if (param == PIPE_SHADER_CAP_PREFERRED_IR) { |
| if (lscreen->use_tgsi) |
| return PIPE_SHADER_IR_TGSI; |
| else |
| return PIPE_SHADER_IR_NIR; |
| } |
| |
| switch (param) { |
| case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS: |
| /* At this time, the draw module and llvmpipe driver only |
| * support vertex shader texture lookups when LLVM is enabled in |
| * the draw module. |
| */ |
| if (debug_get_bool_option("DRAW_USE_LLVM", TRUE)) |
| return PIPE_MAX_SAMPLERS; |
| else |
| return 0; |
| case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS: |
| if (debug_get_bool_option("DRAW_USE_LLVM", TRUE)) |
| return PIPE_MAX_SHADER_SAMPLER_VIEWS; |
| else |
| return 0; |
| default: |
| return draw_get_shader_param(shader, param); |
| } |
| default: |
| return 0; |
| } |
| } |
| |
| static float |
| llvmpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param) |
| { |
| switch (param) { |
| case PIPE_CAPF_MAX_LINE_WIDTH: |
| /* fall-through */ |
| case PIPE_CAPF_MAX_LINE_WIDTH_AA: |
| return 255.0; /* arbitrary */ |
| case PIPE_CAPF_MAX_POINT_WIDTH: |
| /* fall-through */ |
| case PIPE_CAPF_MAX_POINT_WIDTH_AA: |
| return LP_MAX_POINT_WIDTH; /* arbitrary */ |
| case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY: |
| return 16.0; /* not actually signficant at this time */ |
| case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS: |
| return 16.0; /* arbitrary */ |
| case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE: |
| return 0.0; |
| case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE: |
| return 0.0; |
| case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY: |
| return 0.0; |
| } |
| /* should only get here on unhandled cases */ |
| debug_printf("Unexpected PIPE_CAP %d query\n", param); |
| return 0.0; |
| } |
| |
| static int |
| llvmpipe_get_compute_param(struct pipe_screen *_screen, |
| enum pipe_shader_ir ir_type, |
| enum pipe_compute_cap param, |
| void *ret) |
| { |
| switch (param) { |
| case PIPE_COMPUTE_CAP_IR_TARGET: |
| return 0; |
| case PIPE_COMPUTE_CAP_MAX_GRID_SIZE: |
| if (ret) { |
| uint64_t *grid_size = ret; |
| grid_size[0] = 65535; |
| grid_size[1] = 65535; |
| grid_size[2] = 65535; |
| } |
| return 3 * sizeof(uint64_t) ; |
| case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE: |
| if (ret) { |
| uint64_t *block_size = ret; |
| block_size[0] = 1024; |
| block_size[1] = 1024; |
| block_size[2] = 1024; |
| } |
| return 3 * sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK: |
| if (ret) { |
| uint64_t *max_threads_per_block = ret; |
| *max_threads_per_block = 1024; |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE: |
| if (ret) { |
| uint64_t *max_local_size = ret; |
| *max_local_size = 32768; |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_GRID_DIMENSION: |
| if (ret) { |
| uint32_t *grid_dim = ret; |
| *grid_dim = 3; |
| } |
| return sizeof(uint32_t); |
| case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE: |
| if (ret) { |
| uint64_t *max_global_size = ret; |
| *max_global_size = (1ULL << 31); |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE: |
| if (ret) { |
| uint64_t *max_mem_alloc_size = ret; |
| *max_mem_alloc_size = (1ULL << 31); |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE: |
| if (ret) { |
| uint64_t *max_private = ret; |
| *max_private = (1UL << 31); |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE: |
| if (ret) { |
| uint64_t *max_input = ret; |
| *max_input = 4096; |
| } |
| return sizeof(uint64_t); |
| case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED: |
| if (ret) { |
| uint32_t *images = ret; |
| *images = 0; |
| } |
| return sizeof(uint32_t); |
| case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK: |
| return 0; |
| case PIPE_COMPUTE_CAP_SUBGROUP_SIZE: |
| if (ret) { |
| uint32_t *subgroup_size = ret; |
| *subgroup_size = 32; |
| } |
| return sizeof(uint32_t); |
| case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS: |
| if (ret) { |
| uint32_t *max_compute_units = ret; |
| *max_compute_units = 8; |
| } |
| return sizeof(uint32_t); |
| case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY: |
| if (ret) { |
| uint32_t *max_clock_freq = ret; |
| *max_clock_freq = 300; |
| } |
| return sizeof(uint32_t); |
| case PIPE_COMPUTE_CAP_ADDRESS_BITS: |
| if (ret) { |
| uint32_t *address_bits = ret; |
| *address_bits = 64; |
| } |
| return sizeof(uint32_t); |
| } |
| return 0; |
| } |
| |
| static const struct nir_shader_compiler_options gallivm_nir_options = { |
| .lower_scmp = true, |
| .lower_flrp32 = true, |
| .lower_flrp64 = true, |
| .lower_fsat = true, |
| .lower_bitfield_insert_to_shifts = true, |
| .lower_bitfield_extract_to_shifts = true, |
| .lower_sub = true, |
| .lower_fmod = true, |
| .lower_hadd = true, |
| .lower_add_sat = true, |
| .lower_ldexp = true, |
| .lower_pack_snorm_2x16 = true, |
| .lower_pack_snorm_4x8 = true, |
| .lower_pack_unorm_2x16 = true, |
| .lower_pack_unorm_4x8 = true, |
| .lower_pack_half_2x16 = true, |
| .lower_pack_split = true, |
| .lower_unpack_snorm_2x16 = true, |
| .lower_unpack_snorm_4x8 = true, |
| .lower_unpack_unorm_2x16 = true, |
| .lower_unpack_unorm_4x8 = true, |
| .lower_unpack_half_2x16 = true, |
| .lower_extract_byte = true, |
| .lower_extract_word = true, |
| .lower_rotate = true, |
| .lower_uadd_carry = true, |
| .lower_usub_borrow = true, |
| .lower_mul_2x32_64 = true, |
| .lower_ifind_msb = true, |
| .max_unroll_iterations = 32, |
| .use_interpolated_input_intrinsics = true, |
| .lower_to_scalar = true, |
| .lower_cs_local_index_from_id = true, |
| .lower_uniforms_to_ubo = true, |
| }; |
| |
| static void |
| llvmpipe_finalize_nir(struct pipe_screen *screen, |
| void *nirptr, |
| bool optimize) |
| { |
| struct nir_shader *nir = (struct nir_shader *)nirptr; |
| lp_build_opt_nir(nir); |
| } |
| |
| static inline const void * |
| llvmpipe_get_compiler_options(struct pipe_screen *screen, |
| enum pipe_shader_ir ir, |
| enum pipe_shader_type shader) |
| { |
| assert(ir == PIPE_SHADER_IR_NIR); |
| return &gallivm_nir_options; |
| } |
| |
| /** |
| * Query format support for creating a texture, drawing surface, etc. |
| * \param format the format to test |
| * \param type one of PIPE_TEXTURE, PIPE_SURFACE |
| */ |
| static bool |
| llvmpipe_is_format_supported( struct pipe_screen *_screen, |
| enum pipe_format format, |
| enum pipe_texture_target target, |
| unsigned sample_count, |
| unsigned storage_sample_count, |
| unsigned bind) |
| { |
| struct llvmpipe_screen *screen = llvmpipe_screen(_screen); |
| struct sw_winsys *winsys = screen->winsys; |
| const struct util_format_description *format_desc; |
| |
| format_desc = util_format_description(format); |
| if (!format_desc) |
| return false; |
| |
| assert(target == PIPE_BUFFER || |
| target == PIPE_TEXTURE_1D || |
| target == PIPE_TEXTURE_1D_ARRAY || |
| target == PIPE_TEXTURE_2D || |
| target == PIPE_TEXTURE_2D_ARRAY || |
| target == PIPE_TEXTURE_RECT || |
| target == PIPE_TEXTURE_3D || |
| target == PIPE_TEXTURE_CUBE || |
| target == PIPE_TEXTURE_CUBE_ARRAY); |
| |
| if (sample_count != 0 && sample_count != 1 && sample_count != 4) |
| return false; |
| |
| if (MAX2(1, sample_count) != MAX2(1, storage_sample_count)) |
| return false; |
| |
| if (bind & PIPE_BIND_RENDER_TARGET) { |
| if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_SRGB) { |
| /* this is a lie actually other formats COULD exist where we would fail */ |
| if (format_desc->nr_channels < 3) |
| return false; |
| } |
| else if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_RGB) |
| return false; |
| |
| if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN && |
| format != PIPE_FORMAT_R11G11B10_FLOAT) |
| return false; |
| |
| assert(format_desc->block.width == 1); |
| assert(format_desc->block.height == 1); |
| |
| if (format_desc->is_mixed) |
| return false; |
| |
| if (!format_desc->is_array && !format_desc->is_bitmask && |
| format != PIPE_FORMAT_R11G11B10_FLOAT) |
| return false; |
| } |
| |
| if ((bind & (PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW)) && |
| ((bind & PIPE_BIND_DISPLAY_TARGET) == 0)) { |
| /* Disable all 3-channel formats, where channel size != 32 bits. |
| * In some cases we run into crashes (in generate_unswizzled_blend()), |
| * for 3-channel RGB16 variants, there was an apparent LLVM bug. |
| * In any case, disabling the shallower 3-channel formats avoids a |
| * number of issues with GL_ARB_copy_image support. |
| */ |
| if (format_desc->is_array && |
| format_desc->nr_channels == 3 && |
| format_desc->block.bits != 96) { |
| return false; |
| } |
| } |
| |
| if (bind & PIPE_BIND_DISPLAY_TARGET) { |
| if(!winsys->is_displaytarget_format_supported(winsys, bind, format)) |
| return false; |
| } |
| |
| if (bind & PIPE_BIND_DEPTH_STENCIL) { |
| if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN) |
| return false; |
| |
| if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS) |
| return false; |
| } |
| |
| if (format_desc->layout == UTIL_FORMAT_LAYOUT_ASTC || |
| format_desc->layout == UTIL_FORMAT_LAYOUT_ATC || |
| format_desc->layout == UTIL_FORMAT_LAYOUT_FXT1) { |
| /* Software decoding is not hooked up. */ |
| return false; |
| } |
| |
| if (format_desc->layout == UTIL_FORMAT_LAYOUT_ETC && |
| format != PIPE_FORMAT_ETC1_RGB8) |
| return false; |
| |
| /* |
| * Everything can be supported by u_format |
| * (those without fetch_rgba_float might be not but shouldn't hit that) |
| */ |
| |
| return true; |
| } |
| |
| |
| |
| |
| static void |
| llvmpipe_flush_frontbuffer(struct pipe_screen *_screen, |
| struct pipe_resource *resource, |
| unsigned level, unsigned layer, |
| void *context_private, |
| struct pipe_box *sub_box) |
| { |
| struct llvmpipe_screen *screen = llvmpipe_screen(_screen); |
| struct sw_winsys *winsys = screen->winsys; |
| struct llvmpipe_resource *texture = llvmpipe_resource(resource); |
| |
| assert(texture->dt); |
| if (texture->dt) |
| winsys->displaytarget_display(winsys, texture->dt, context_private, sub_box); |
| } |
| |
| static void |
| llvmpipe_destroy_screen( struct pipe_screen *_screen ) |
| { |
| struct llvmpipe_screen *screen = llvmpipe_screen(_screen); |
| struct sw_winsys *winsys = screen->winsys; |
| |
| if (screen->cs_tpool) |
| lp_cs_tpool_destroy(screen->cs_tpool); |
| |
| if (screen->rast) |
| lp_rast_destroy(screen->rast); |
| |
| lp_jit_screen_cleanup(screen); |
| |
| if (LP_DEBUG & DEBUG_CACHE_STATS) |
| printf("disk shader cache: hits = %u, misses = %u\n", screen->num_disk_shader_cache_hits, |
| screen->num_disk_shader_cache_misses); |
| disk_cache_destroy(screen->disk_shader_cache); |
| if(winsys->destroy) |
| winsys->destroy(winsys); |
| |
| glsl_type_singleton_decref(); |
| |
| mtx_destroy(&screen->rast_mutex); |
| mtx_destroy(&screen->cs_mutex); |
| FREE(screen); |
| } |
| |
| |
| |
| |
| /** |
| * Fence reference counting. |
| */ |
| static void |
| llvmpipe_fence_reference(struct pipe_screen *screen, |
| struct pipe_fence_handle **ptr, |
| struct pipe_fence_handle *fence) |
| { |
| struct lp_fence **old = (struct lp_fence **) ptr; |
| struct lp_fence *f = (struct lp_fence *) fence; |
| |
| lp_fence_reference(old, f); |
| } |
| |
| |
| /** |
| * Wait for the fence to finish. |
| */ |
| static bool |
| llvmpipe_fence_finish(struct pipe_screen *screen, |
| struct pipe_context *ctx, |
| struct pipe_fence_handle *fence_handle, |
| uint64_t timeout) |
| { |
| struct lp_fence *f = (struct lp_fence *) fence_handle; |
| |
| if (!timeout) |
| return lp_fence_signalled(f); |
| |
| if (!lp_fence_signalled(f)) { |
| if (timeout != PIPE_TIMEOUT_INFINITE) |
| return lp_fence_timedwait(f, timeout); |
| |
| lp_fence_wait(f); |
| } |
| return true; |
| } |
| |
| static uint64_t |
| llvmpipe_get_timestamp(struct pipe_screen *_screen) |
| { |
| return os_time_get_nano(); |
| } |
| |
| static void lp_disk_cache_create(struct llvmpipe_screen *screen) |
| { |
| struct mesa_sha1 ctx; |
| unsigned gallivm_perf = gallivm_get_perf_flags(); |
| unsigned char sha1[20]; |
| char cache_id[20 * 2 + 1]; |
| _mesa_sha1_init(&ctx); |
| |
| if (!disk_cache_get_function_identifier(lp_disk_cache_create, &ctx) || |
| !disk_cache_get_function_identifier(LLVMLinkInMCJIT, &ctx)) |
| return; |
| |
| _mesa_sha1_update(&ctx, &gallivm_perf, sizeof(gallivm_perf)); |
| _mesa_sha1_final(&ctx, sha1); |
| disk_cache_format_hex_id(cache_id, sha1, 20 * 2); |
| |
| screen->disk_shader_cache = disk_cache_create("llvmpipe", cache_id, 0); |
| } |
| |
| static struct disk_cache *lp_get_disk_shader_cache(struct pipe_screen *_screen) |
| { |
| struct llvmpipe_screen *screen = llvmpipe_screen(_screen); |
| |
| return screen->disk_shader_cache; |
| } |
| |
| void lp_disk_cache_find_shader(struct llvmpipe_screen *screen, |
| struct lp_cached_code *cache, |
| unsigned char ir_sha1_cache_key[20]) |
| { |
| unsigned char sha1[CACHE_KEY_SIZE]; |
| |
| if (!screen->disk_shader_cache) |
| return; |
| disk_cache_compute_key(screen->disk_shader_cache, ir_sha1_cache_key, 20, sha1); |
| |
| size_t binary_size; |
| uint8_t *buffer = disk_cache_get(screen->disk_shader_cache, sha1, &binary_size); |
| if (!buffer) { |
| cache->data_size = 0; |
| p_atomic_inc(&screen->num_disk_shader_cache_misses); |
| return; |
| } |
| cache->data_size = binary_size; |
| cache->data = buffer; |
| p_atomic_inc(&screen->num_disk_shader_cache_hits); |
| } |
| |
| void lp_disk_cache_insert_shader(struct llvmpipe_screen *screen, |
| struct lp_cached_code *cache, |
| unsigned char ir_sha1_cache_key[20]) |
| { |
| unsigned char sha1[CACHE_KEY_SIZE]; |
| |
| if (!screen->disk_shader_cache || !cache->data_size || cache->dont_cache) |
| return; |
| disk_cache_compute_key(screen->disk_shader_cache, ir_sha1_cache_key, 20, sha1); |
| disk_cache_put(screen->disk_shader_cache, sha1, cache->data, cache->data_size, NULL); |
| } |
| /** |
| * Create a new pipe_screen object |
| * Note: we're not presently subclassing pipe_screen (no llvmpipe_screen). |
| */ |
| struct pipe_screen * |
| llvmpipe_create_screen(struct sw_winsys *winsys) |
| { |
| struct llvmpipe_screen *screen; |
| |
| util_cpu_detect(); |
| |
| glsl_type_singleton_init_or_ref(); |
| |
| #ifdef DEBUG |
| LP_DEBUG = debug_get_flags_option("LP_DEBUG", lp_debug_flags, 0 ); |
| #endif |
| |
| LP_PERF = debug_get_flags_option("LP_PERF", lp_perf_flags, 0 ); |
| |
| screen = CALLOC_STRUCT(llvmpipe_screen); |
| if (!screen) |
| return NULL; |
| |
| if (!lp_jit_screen_init(screen)) { |
| FREE(screen); |
| return NULL; |
| } |
| |
| screen->winsys = winsys; |
| |
| screen->base.destroy = llvmpipe_destroy_screen; |
| |
| screen->base.get_name = llvmpipe_get_name; |
| screen->base.get_vendor = llvmpipe_get_vendor; |
| screen->base.get_device_vendor = llvmpipe_get_vendor; // TODO should be the CPU vendor |
| screen->base.get_param = llvmpipe_get_param; |
| screen->base.get_shader_param = llvmpipe_get_shader_param; |
| screen->base.get_compute_param = llvmpipe_get_compute_param; |
| screen->base.get_paramf = llvmpipe_get_paramf; |
| screen->base.get_compiler_options = llvmpipe_get_compiler_options; |
| screen->base.is_format_supported = llvmpipe_is_format_supported; |
| |
| screen->base.context_create = llvmpipe_create_context; |
| screen->base.flush_frontbuffer = llvmpipe_flush_frontbuffer; |
| screen->base.fence_reference = llvmpipe_fence_reference; |
| screen->base.fence_finish = llvmpipe_fence_finish; |
| |
| screen->base.get_timestamp = llvmpipe_get_timestamp; |
| |
| screen->base.finalize_nir = llvmpipe_finalize_nir; |
| |
| screen->base.get_disk_shader_cache = lp_get_disk_shader_cache; |
| llvmpipe_init_screen_resource_funcs(&screen->base); |
| |
| screen->use_tgsi = (LP_DEBUG & DEBUG_TGSI_IR); |
| screen->num_threads = util_cpu_caps.nr_cpus > 1 ? util_cpu_caps.nr_cpus : 0; |
| #ifdef EMBEDDED_DEVICE |
| screen->num_threads = 0; |
| #endif |
| screen->num_threads = debug_get_num_option("LP_NUM_THREADS", screen->num_threads); |
| screen->num_threads = MIN2(screen->num_threads, LP_MAX_THREADS); |
| |
| screen->rast = lp_rast_create(screen->num_threads); |
| if (!screen->rast) { |
| lp_jit_screen_cleanup(screen); |
| FREE(screen); |
| return NULL; |
| } |
| (void) mtx_init(&screen->rast_mutex, mtx_plain); |
| |
| screen->cs_tpool = lp_cs_tpool_create(screen->num_threads); |
| if (!screen->cs_tpool) { |
| lp_rast_destroy(screen->rast); |
| lp_jit_screen_cleanup(screen); |
| FREE(screen); |
| return NULL; |
| } |
| (void) mtx_init(&screen->cs_mutex, mtx_plain); |
| |
| lp_disk_cache_create(screen); |
| return &screen->base; |
| } |