From da02083ce6ce77ed90db4be4c628118150f99df1 Mon Sep 17 00:00:00 2001 From: tnn Date: Sun, 13 Mar 2022 15:50:05 +0000 Subject: MesaLib: update to 21.3.7 Of particular note is this change in Mesa 21.2: "32-bit x86 builds now default disable x87 math and use sse2." This might need to be revisited in pkgsrc. Bugfixes omitted from ChangeLog. New features in Mesa 21.3: VK_EXT_color_write_enable on lavapipe GL_ARB_texture_filter_anisotropic in llvmpipe Anisotropic texture filtering in lavapipe VK_EXT_shader_atomic_float2 on Intel and RADV. VK_EXT_vertex_input_dynamic_state on RADV. VK_KHR_timeline_semaphore on lavapipe VK_EXT_external_memory_host on lavapipe GL_AMD_pinned_memory on llvmpipe GL 4.5 compatibility on llvmpipe VK_EXT_primitive_topology_list_restart on RADV and lavapipe. ES 3.2 on zink VK_KHR_depth_stencil_resolve on lavapipe VK_KHR_shader_integer_dot_product on RADV. OpenGL FP16 support on llvmpipe VK_KHR_shader_float16_int8 on lavapipe VK_KHR_shader_subgroup_extended_types on lavapipe VK_KHR_spirv_1_4 on lavapipe Experimental raytracing support on RADV VK_KHR_synchronization2 on Intel NGG shader based culling is now enabled by default on GFX10.3 on RADV. VK_KHR_maintenance4 on RADV VK_KHR_format_feature_flags2 on RADV. EGL_EXT_present_opaque on wayland New features in Mesa 21.2: zink supports GL_ARB_texture_filter_minmax, GL_ARB_shader_clock VK_EXT_provoking_vertex on RADV. VK_EXT_extended_dynamic_state2 on RADV. VK_EXT_global_priority_query on RADV. VK_EXT_physical_device_drm on RADV. VK_KHR_shader_subgroup_uniform_control_flow on Intel and RADV. VK_EXT_color_write_enable on RADV. 32-bit x86 builds now default disable x87 math and use sse2. GL ES 3.1 on GT21x hardware. VK_EXT_acquire_drm_display on RADV and ANV. VK_EXT_vertex_input_dynamic_state on lavapipe wideLines on lavapipe VK_EXT_line_rasterization on lavapipe VK_EXT_multi_draw on ANV, lavapipe, and RADV VK_KHR_separate_depth_stencil_layouts on lavapipe VK_EXT_separate_stencil_usage on lavapipe VK_EXT_extended_dynamic_state2 on lavapipe NGG shader based primitive culling is now supported by RADV. Panfrost supports OpenGL ES 3.1 New Asahi driver for the Apple M1 GL_ARB_sample_locations on zink GL_ARB_sparse_buffer on zink GL_ARB_shader_group_vote on zink DRM format modifiers on zink freedreno+turnip: Initial support for a6xx gen4 (a660, a635) New features in Mesa 21.1: VK_KHR_workgroup_memory_explicit_layout on Intel, RADV DRM format modifiers for AMD. VK_KHR_zero_initialize_workgroup_memory on Intel, RADV Zink exposes GL 4.6 and ES 3.1 GL_EXT_depth_bounds_test on softpipe, zink GL_EXT_texture_filter_minmax on nvc0 (gm200+) GL_ARB_texture_filter_minmax on nvc0 (gm200+) GL_ARB_post_depth_coverage on zink VK_KHR_copy_commands2 on lavapipe lavapipe exposes Vulkan 1.1 VRS attachment on RADV New features in Mesa 21.0: GL_EXT_demote_to_helper_invocation on radeonsi GL_NV_compute_shader_derivatives on radeonsi EGL_MESA_platform_xcb Removed GL_NV_point_sprite for classic swrast. driconf: remove glx_disable_oml_sync_control, glx_disable_sgi_video_sync, and glx_disable_ext_buffer_age Removed support for loading DRI drivers older than Mesa 8.0, including all DRI1 support Add support for VK_VALVE_mutable_descriptor_type on RADV Removed classic OSMesa in favor of the newly improved gallium OSMesa VK_KHR_fragment_shading_rate on RADV (RDNA2 only) Freedreno a6xx exposes GL 3.3 Classic swrast dri driver removed in favor of gallium swrast (llvmpipe or softpipe) Panfrost g31/g52/g72 exposes ES 3.0 Panfrost t760+ exposes GL 3.1 (including on Bifrost) Sparse memory support on RADV Rapid packed math (16bit-vectorization) on RADV New features in Mesa 20.3: GL 4.5 on llvmpipe GL_INTEL_blackhole_render on radeonsi GL_NV_copy_depth_to_color for NIR GL_NV_half_float GL_NV_shader_atomic_int64 on radeonsi EGL_KHR_swap_buffers_with_damage on X11 (DRI3) VK_PRESENT_MODE_FIFO_RELAXED on X11 GLX_EXT_swap_control for DRI2 and DRI3 GLX_EXT_swap_control_tear for DRI3 VK_KHR_copy_commands2 on RADV VK_KHR_shader_terminate_invocation on RADV NGG GS support in ACO VK_KHR_shader_terminate_invocation on ANV driconf: add glx_extension_override driconf: add indirect_gl_extension_override VK_AMD_mixed_attachment_samples on RADV (GFX6-GFX7). GL_MESA_pack_invert on r100 and vieux GL_ANGLE_pack_reverse_row_order VK_EXT_shader_image_atomic_int64 on RADV New features in mesa 20.2: GL_ARB_compute_variable_group_size on Iris. GL_ARB_gpu_shader5 on llvmpipe GL_ARB_post_depth_coverage on llvmpipe GLES 3.2 on llvmpipe GL_EXT_shader_group_vote on GLES3. GL_EXT_texture_shadow_lod on llvmpipe VK_AMD_texture_gather_bias_lod on RADV. VK_AMD_gpu_shader_half_float on RADV/ACO. VK_AMD_gpu_shader_int16 on RADV/ACO. VK_EXT_extended_dynamic_state on ANV and RADV. VK_EXT_image_robustness on RADV. VK_EXT_private_data on ANV and RADV. VK_EXT_custom_border_color on ANV and RADV. VK_EXT_pipeline_creation_cache_control on ANV and RADV. VK_EXT_shader_demote_to_helper_invocation on RADV/LLVM. VK_EXT_subgroup_size_control on RADV/ACO. VK_GOOGLE_user_type on ANV and RADV. VK_KHR_shader_subgroup_extended_types on RADV/ACO. GL_ARB_gl_spirv on nvc0/nir. GL_ARB_spirv_extensions on nvc0/nir. RADV now uses ACO per default as backend RADV_DEBUG=llvm option to enable LLVM backend for RADV VK_EXT_image_robustness for ANV VK_EXT_shader_atomic_float on ANV VK_EXT_4444_formats on ANV and RADV. VK_KHR_memory_model on RADV. GL 4.5 on llvmpipe EGL_KHR_swap_buffers_with_damage on X11 (DRI3) New features in mesa 20.1: GL_ARB_compute_variable_group_size on i965. GL_EXT_depth_bounds_test on Iris. GL_EXT_texture_shadow_lod on radeonsi, nvc0. GL_NV_alpha_to_coverage_dither_control on radeonsi GL_NV_copy_image on all gallium drivers. GL_NV_pixel_buffer_object on all gallium drivers, i915, i965, swrast. GL_NV_viewport_array2 on nvc0 (GM200+). GL_NV_viewport_swizzle on nvc0 (GM200+). VK_AMD_memory_overallocation_behavior on RADV. VK_KHR_shader_non_semantic_info on Intel, RADV. GL_EXT_draw_instanced on gles2 VK_KHR_8bit_storage for ACO on GFX8+ VK_KHR_16bit_storage for ACO on GFX8+ (storageInputOutput16 is still unsupported) shaderInt16 for ACO on GFX9+ VK_KHR_shader_float16_int8 for ACO on GFX8+ (shaderFloat16 is still unsupported) VK_EXT_robustness2 on Intel, RADV. Add Rocket Lake (RKL) support on anvil and iris. --- .../MesaLib/patches/patch-src_util_u__thread.h | 108 ++++++++------------- 1 file changed, 41 insertions(+), 67 deletions(-) (limited to 'graphics/MesaLib/patches/patch-src_util_u__thread.h') diff --git a/graphics/MesaLib/patches/patch-src_util_u__thread.h b/graphics/MesaLib/patches/patch-src_util_u__thread.h index 64db83fb096..d4e6882b489 100644 --- a/graphics/MesaLib/patches/patch-src_util_u__thread.h +++ b/graphics/MesaLib/patches/patch-src_util_u__thread.h @@ -1,95 +1,69 @@ -$NetBSD: patch-src_util_u__thread.h,v 1.4 2020/03/08 10:35:03 tnn Exp $ +$NetBSD: patch-src_util_u__thread.h,v 1.5 2022/03/13 15:50:05 tnn Exp $ Oracle Solaris has pthread_setname_np. illumos does not. +(actually, newer Illumos does have it, but never mind.) Don't hard error when there's no pthread_setname_np. handle NetBSD-style pthread_setaffinity_np(3) ---- src/util/u_thread.h.orig 2020-03-05 21:34:32.000000000 +0000 +--- src/util/u_thread.h.orig 2021-08-04 18:49:29.374474500 +0000 +++ src/util/u_thread.h -@@ -73,7 +73,7 @@ static inline thrd_t u_thread_create(int +@@ -129,7 +129,7 @@ static inline thrd_t u_thread_create(int static inline void u_thread_setname( const char *name ) { #if defined(HAVE_PTHREAD) -#if DETECT_OS_LINUX || DETECT_OS_CYGWIN || DETECT_OS_SOLARIS +#if DETECT_OS_LINUX || DETECT_OS_CYGWIN - pthread_setname_np(pthread_self(), name); - #elif DETECT_OS_FREEBSD || DETECT_OS_OPENBSD - pthread_set_name_np(pthread_self(), name); -@@ -104,6 +104,17 @@ static inline void - util_pin_thread_to_L3(thrd_t thread, unsigned L3_index, unsigned cores_per_L3) + int ret = pthread_setname_np(pthread_self(), name); + if (ret == ERANGE) { + char buf[16]; +@@ -169,8 +169,32 @@ util_set_thread_affinity(thrd_t thread, + unsigned num_mask_bits) { #if defined(HAVE_PTHREAD_SETAFFINITY) -+#if defined(__NetBSD__) -+ cpuset_t *cpuset; +- cpu_set_t cpuset; ++# if defined(__NetBSD__) ++ cpu_set_t *cpuset; + cpuset = cpuset_create(); + if (cpuset == NULL) + return; -+ cpuset_zero(cpuset); -+ for (unsigned i = 0; i < cores_per_L3; i++) -+ cpuset_set(L3_index * cores_per_L3 + i, cpuset); -+ pthread_setaffinity_np(thread, cpuset_size(cpuset), cpuset); -+ cpuset_destroy(cpuset); -+#else - cpu_set_t cpuset; ++ if (old_mask) { ++ if (pthread_getaffinity_np(thread, cpuset_size(cpuset), cpuset) != 0) ++ return false; - CPU_ZERO(&cpuset); -@@ -111,6 +122,7 @@ util_pin_thread_to_L3(thrd_t thread, uns - CPU_SET(L3_index * cores_per_L3 + i, &cpuset); - pthread_setaffinity_np(thread, sizeof(cpuset), &cpuset); - #endif -+#endif - } - - /** -@@ -124,6 +136,35 @@ static inline int - util_get_L3_for_pinned_thread(thrd_t thread, unsigned cores_per_L3) - { - #if defined(HAVE_PTHREAD_SETAFFINITY) -+#if defined(__NetBSD__) -+ cpuset_t *cpuset; -+ -+ cpuset = cpuset_create(); -+ if (cpuset == NULL) -+ return -1; -+ -+ if (pthread_getaffinity_np(thread, cpuset_size(cpuset), cpuset) == 0) { -+ int L3_index = -1; -+ -+ for (unsigned i = 0; i < cpuset_size(cpuset); i++) { -+ if (cpuset_isset(i, cpuset)) { -+ int x = i / cores_per_L3; -+ -+ if (L3_index != x) { -+ if (L3_index == -1) -+ L3_index = x; -+ else { -+ cpuset_destroy(cpuset); -+ return -1; /* multiple L3s are set */ -+ } -+ } -+ } ++ memset(old_mask, 0, num_mask_bits / 8); ++ for (unsigned i = 0; i < num_mask_bits && i < CPU_SETSIZE; i++) { ++ if (cpuset_isset(i, cpuset)) ++ old_mask[i / 32] |= 1u << (i % 32); + } -+ cpuset_destroy(cpuset); -+ return L3_index; + } ++ ++ cpuset_zero(cpuset); ++ for (unsigned i = 0; i < num_mask_bits && i < CPU_SETSIZE; i++) { ++ if (mask[i / 32] & (1u << (i % 32))) ++ cpuset_set(i, cpuset); ++ } ++ int err = pthread_setaffinity_np(thread, cpuset_size(cpuset), cpuset); + cpuset_destroy(cpuset); -+#else - cpu_set_t cpuset; - - if (pthread_getaffinity_np(thread, sizeof(cpuset), &cpuset) == 0) { -@@ -144,6 +185,7 @@ util_get_L3_for_pinned_thread(thrd_t thr - return L3_index; ++ return err == 0; ++# else ++ cpu_set_t cpuset; + if (old_mask) { + if (pthread_getaffinity_np(thread, sizeof(cpuset), &cpuset) != 0) + return false; +@@ -188,7 +212,7 @@ util_set_thread_affinity(thrd_t thread, + CPU_SET(i, &cpuset); } - #endif -+#endif - return -1; - } + return pthread_setaffinity_np(thread, sizeof(cpuset), &cpuset) == 0; +- ++# endif + #elif defined(_WIN32) && !defined(__CYGWIN__) + DWORD_PTR m = mask[0]; -@@ -155,7 +197,7 @@ util_get_L3_for_pinned_thread(thrd_t thr +@@ -242,7 +266,7 @@ util_set_current_thread_affinity(const u static inline int64_t - u_thread_get_time_nano(thrd_t thread) + util_thread_get_time_nano(thrd_t thread) { -#if defined(HAVE_PTHREAD) && !defined(__APPLE__) && !defined(__HAIKU__) +#if defined(HAVE_PTHREAD) && !defined(__APPLE__) && !defined(__HAIKU__) && !defined(__sun) -- cgit v1.2.3