From ce4c96ea1bce9f2f85fccc33bda9277bd6339139 Mon Sep 17 00:00:00 2001 From: Jan Zielinski Date: Thu, 10 Jun 2021 13:16:04 +0200 Subject: [PATCH] gallium/swr: clean up the documentation after SWR removal from main Reviewed-by: Dylan Baker Part-of: --- docs/conf.py | 5 - docs/drivers/openswr.rst | 24 ----- docs/drivers/openswr/faq.rst | 141 ----------------------------- docs/drivers/openswr/knobs.rst | 114 ----------------------- docs/drivers/openswr/profiling.rst | 67 -------------- docs/drivers/openswr/usage.rst | 38 -------- docs/envvars.rst | 3 +- docs/features.txt | 138 ++++++++++++++-------------- docs/history.rst | 3 +- docs/index.rst | 1 - docs/meson.rst | 1 - docs/sourcetree.rst | 1 - docs/systems.rst | 2 - 13 files changed, 71 insertions(+), 467 deletions(-) delete mode 100644 docs/drivers/openswr.rst delete mode 100644 docs/drivers/openswr/faq.rst delete mode 100644 docs/drivers/openswr/knobs.rst delete mode 100644 docs/drivers/openswr/profiling.rst delete mode 100644 docs/drivers/openswr/usage.rst diff --git a/docs/conf.py b/docs/conf.py index ba789390467..998f209e998 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -139,11 +139,6 @@ html_redirects = [ ('gallium/drivers/freedreno', 'drivers/freedreno.html'), ('gallium/drivers/freedreno/ir3-notes', 'drivers/freedreno/ir3-notes.html'), ('gallium/drivers/llvmpipe', 'drivers/llvmpipe.html'), - ('gallium/drivers/openswr', 'drivers/openswr.html'), - ('gallium/drivers/openswr/faq', 'drivers/openswr/faq.html'), - ('gallium/drivers/openswr/knobs', 'drivers/openswr/knobs.html'), - ('gallium/drivers/openswr/profiling', 'drivers/openswr/profiling.html'), - ('gallium/drivers/openswr/usage', 'drivers/openswr/usage.html'), ('gallium/drivers/zink', 'drivers/zink.html'), ('llvmpipe', 'drivers/llvmpipe.html'), ('postprocess', 'gallium/postprocess.html'), diff --git a/docs/drivers/openswr.rst b/docs/drivers/openswr.rst deleted file mode 100644 index 4435219c8a1..00000000000 --- a/docs/drivers/openswr.rst +++ /dev/null @@ -1,24 +0,0 @@ -OpenSWR -======= - -The Gallium OpenSWR driver is a high performance, highly scalable -software renderer targeted towards visualization workloads. For such -geometry heavy workloads there is a considerable speedup over llvmpipe, -which is to be expected as the geometry frontend of llvmpipe is single -threaded. - -This rasterizer is x86 specific and requires AVX or above. The driver -fits into the gallium framework, and reuses gallivm for doing the TGSI -to vectorized llvm-IR conversion of the shader kernels. - -You can read more about OpenSWR on the `project website -`__. - -.. toctree:: - :glob: - - openswr/usage - openswr/faq - openswr/profiling - openswr/knobs - diff --git a/docs/drivers/openswr/faq.rst b/docs/drivers/openswr/faq.rst deleted file mode 100644 index 1d058f92222..00000000000 --- a/docs/drivers/openswr/faq.rst +++ /dev/null @@ -1,141 +0,0 @@ -FAQ -=== - -Why another software rasterizer? --------------------------------- - -Good question, given there are already three (swrast, softpipe, -llvmpipe) in the Mesa tree. Two important reasons for this: - - * Architecture - given our focus on scientific visualization, our - workloads are much different than the typical game; we have heavy - vertex load and relatively simple shaders. In addition, the core - counts of machines we run on are much higher. These parameters led - to design decisions much different than llvmpipe. - - * Historical - Intel had developed a high performance software - graphics stack for internal purposes. Later we adapted this - graphics stack for use in visualization and decided to move forward - with Mesa to provide a high quality API layer while at the same - time benefiting from the excellent performance the software - rasterizerizer gives us. - -What's the architecture? ------------------------- - -SWR is a tile based immediate mode renderer with a sort-free threading -model which is arranged as a ring of queues. Each entry in the ring -represents a draw context that contains all of the draw state and work -queues. An API thread sets up each draw context and worker threads -will execute both the frontend (vertex/geometry processing) and -backend (fragment) work as required. The ring allows for backend -threads to pull work in order. Large draws are split into chunks to -allow vertex processing to happen in parallel, with the backend work -pickup preserving draw ordering. - -Our pipeline uses just-in-time compiled code for the fetch shader that -does vertex attribute gathering and AOS to SOA conversions, the vertex -shader and fragment shaders, streamout, and fragment blending. SWR -core also supports geometry and compute shaders but we haven't exposed -them through our driver yet. The fetch shader, streamout, and blend is -built internally to swr core using LLVM directly, while for the vertex -and pixel shaders we reuse bits of llvmpipe from -``gallium/auxiliary/gallivm`` to build the kernels, which we wrap -differently than llvmpipe's ``auxiliary/draw`` code. - -What's the performance? ------------------------ - -For the types of high-geometry workloads we're interested in, we are -significantly faster than llvmpipe. This is to be expected, as -llvmpipe only threads the fragment processing and not the geometry -frontend. The performance advantage over llvmpipe roughly scales -linearly with the number of cores available. - -While our current performance is quite good, we know there is more -potential in this architecture. When we switched from a prototype -OpenGL driver to Mesa we regressed performance severely, some due to -interface issues that need tuning, some differences in shader code -generation, and some due to conformance and feature additions to the -core swr. We are looking to recovering most of this performance back. - -What's the conformance? ------------------------ - -The major applications we are targeting are all based on the -Visualization Toolkit (VTK), and as such our development efforts have -been focused on making sure these work as best as possible. Our -current code passes vtk's rendering tests with their new "OpenGL2" -(really OpenGL 3.2) backend at 99%. - -piglit testing shows a much lower pass rate, roughly 80% at the time -of writing. Core SWR undergoes rigorous unit testing and we are quite -confident in the rasterizer, and understand the areas where it -currently has issues (example: line rendering is done with triangles, -so doesn't match the strict line rendering rules). The majority of -the piglit failures are errors in our driver layer interfacing Mesa -and SWR. Fixing these issues is one of our major future development -goals. - -Why are you open sourcing this? -------------------------------- - - * Our customers prefer open source, and allowing them to simply - download the Mesa source and enable our driver makes life much - easier for them. - - * The internal gallium APIs are not stable, so we'd like our driver - to be visible for changes. - - * It's easier to work with the Mesa community when the source we're - working with can be used as reference. - -What are your development plans? --------------------------------- - - * Performance - see the performance section earlier for details. - - * Conformance - see the conformance section earlier for details. - - * Features - core SWR has a lot of functionality we have yet to - expose through our driver, such as MSAA, geometry shaders, compute - shaders, and tesselation. - - * AVX512 support - -What is the licensing of the code? ----------------------------------- - - * All code is under the normal Mesa MIT license. - -Will this work on AMD? ----------------------- - - * If using an AMD processor with AVX or AVX2, it should work though - we don't have that hardware around to test. Patches if needed - would be welcome. - -Will this work on ARM, MIPS, POWER, ? -------------------------------------------------------------------------- - - * Not without a lot of work. We make extensive use of AVX and AVX2 - intrinsics in our code and the in-tree JIT creation. It is not the - intention for this codebase to support non-x86 architectures. - -What hardware do I need? ------------------------- - - * Any x86 processor with at least AVX (introduced in the Intel - SandyBridge and AMD Bulldozer microarchitectures in 2011) will - work. - - * You don't need a fire-breathing Xeon machine to work on SWR - we do - day-to-day development with laptops and desktop CPUs. - -Does one build work on both AVX and AVX2? ------------------------------------------ - -Yes. The build system creates two shared libraries, ``libswrAVX.so`` and -``libswrAVX2.so``, and ``swr_create_screen()`` loads the appropriate one at -runtime. - diff --git a/docs/drivers/openswr/knobs.rst b/docs/drivers/openswr/knobs.rst deleted file mode 100644 index 06f228a2e92..00000000000 --- a/docs/drivers/openswr/knobs.rst +++ /dev/null @@ -1,114 +0,0 @@ -Knobs -===== - -OpenSWR has a number of environment variables which control its -operation, in addition to the normal Mesa and gallium controls. - -.. envvar:: KNOB_ENABLE_ASSERT_DIALOGS (true) - -Use dialogs when asserts fire. Asserts are only enabled in debug builds - -.. envvar:: KNOB_SINGLE_THREADED (false) - -If enabled will perform all rendering on the API thread. This is useful mainly for debugging purposes. - -.. envvar:: KNOB_DUMP_SHADER_IR (false) - -Dumps shader LLVM IR at various stages of jit compilation. - -.. envvar:: KNOB_USE_GENERIC_STORETILE (false) - -Always use generic function for performing StoreTile. Will be slightly slower than using optimized (jitted) path - -.. envvar:: KNOB_FAST_CLEAR (true) - -Replace 3D primitive execute with a SWRClearRT operation and defer clear execution to first backend op on hottile, or hottile store - -.. envvar:: KNOB_MAX_NUMA_NODES (0) - -Maximum # of NUMA-nodes per system used for worker threads 0 == ALL NUMA-nodes in the system N == Use at most N NUMA-nodes for rendering - -.. envvar:: KNOB_MAX_CORES_PER_NUMA_NODE (0) - -Maximum # of cores per NUMA-node used for worker threads. 0 == ALL non-API thread cores per NUMA-node N == Use at most N cores per NUMA-node - -.. envvar:: KNOB_MAX_THREADS_PER_CORE (1) - -Maximum # of (hyper)threads per physical core used for worker threads. 0 == ALL hyper-threads per core N == Use at most N hyper-threads per physical core - -.. envvar:: KNOB_MAX_WORKER_THREADS (0) - -Maximum worker threads to spawn. IMPORTANT: If this is non-zero, no worker threads will be bound to specific HW threads. They will all be "floating" SW threads. In this case, the above 3 KNOBS will be ignored. - -.. envvar:: KNOB_BUCKETS_START_FRAME (1200) - -Frame from when to start saving buckets data. NOTE: KNOB_ENABLE_RDTSC must be enabled in core/knobs.h for this to have an effect. - -.. envvar:: KNOB_BUCKETS_END_FRAME (1400) - -Frame at which to stop saving buckets data. NOTE: KNOB_ENABLE_RDTSC must be enabled in core/knobs.h for this to have an effect. - -.. envvar:: KNOB_WORKER_SPIN_LOOP_COUNT (5000) - -Number of spin-loop iterations worker threads will perform before going to sleep when waiting for work - -.. envvar:: KNOB_MAX_DRAWS_IN_FLIGHT (160) - -Maximum number of draws outstanding before API thread blocks. - -.. envvar:: KNOB_MAX_PRIMS_PER_DRAW (2040) - -Maximum primitives in a single Draw(). Larger primitives are split into smaller Draw calls. Should be a multiple of (3 * vectorWidth). - -.. envvar:: KNOB_MAX_TESS_PRIMS_PER_DRAW (16) - -Maximum primitives in a single Draw() with tessellation enabled. Larger primitives are split into smaller Draw calls. Should be a multiple of (vectorWidth). - -.. envvar:: KNOB_MAX_FRAC_ODD_TESS_FACTOR (63.0f) - -(DEBUG) Maximum tessellation factor for fractional-odd partitioning. - -.. envvar:: KNOB_MAX_FRAC_EVEN_TESS_FACTOR (64.0f) - -(DEBUG) Maximum tessellation factor for fractional-even partitioning. - -.. envvar:: KNOB_MAX_INTEGER_TESS_FACTOR (64) - -(DEBUG) Maximum tessellation factor for integer partitioning. - -.. envvar:: KNOB_BUCKETS_ENABLE_THREADVIZ (false) - -Enable threadviz output. - -.. envvar:: KNOB_TOSS_DRAW (false) - -Disable per-draw/dispatch execution - -.. envvar:: KNOB_TOSS_QUEUE_FE (false) - -Stop per-draw execution at worker FE NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_FETCH (false) - -Stop per-draw execution at vertex fetch NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_IA (false) - -Stop per-draw execution at input assembler NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_VS (false) - -Stop per-draw execution at vertex shader NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_SETUP_TRIS (false) - -Stop per-draw execution at primitive setup NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_BIN_TRIS (false) - -Stop per-draw execution at primitive binning NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - -.. envvar:: KNOB_TOSS_RS (false) - -Stop per-draw execution at rasterizer NOTE: Requires KNOB_ENABLE_TOSS_POINTS to be enabled in core/knobs.h - diff --git a/docs/drivers/openswr/profiling.rst b/docs/drivers/openswr/profiling.rst deleted file mode 100644 index 357754c3506..00000000000 --- a/docs/drivers/openswr/profiling.rst +++ /dev/null @@ -1,67 +0,0 @@ -Profiling -========= - -OpenSWR contains built-in profiling which can be enabled -at build time to provide insight into performance tuning. - -To enable this, uncomment the following line in ``rasterizer/core/knobs.h`` and rebuild: :: - - //#define KNOB_ENABLE_RDTSC - -Running an application will result in a ``rdtsc.txt`` file being -created in current working directory. This file contains profile -information captured between the ``KNOB_BUCKETS_START_FRAME`` and -``KNOB_BUCKETS_END_FRAME`` (see knobs section). - -The resulting file will contain sections for each thread with a -hierarchical breakdown of the time spent in the various operations. -For example: :: - - Thread 0 (API) - %Tot %Par Cycles CPE NumEvent CPE2 NumEvent2 Bucket - 0.00 0.00 28370 2837 10 0 0 APIClearRenderTarget - 0.00 41.23 11698 1169 10 0 0 |-> APIDrawWakeAllThreads - 0.00 18.34 5202 520 10 0 0 |-> APIGetDrawContext - 98.72 98.72 12413773688 29957 414380 0 0 APIDraw - 0.36 0.36 44689364 107 414380 0 0 |-> APIDrawWakeAllThreads - 96.36 97.62 12117951562 9747 1243140 0 0 |-> APIGetDrawContext - 0.00 0.00 19904 995 20 0 0 APIStoreTiles - 0.00 7.88 1568 78 20 0 0 |-> APIDrawWakeAllThreads - 0.00 25.28 5032 251 20 0 0 |-> APIGetDrawContext - 1.28 1.28 161344902 64 2486370 0 0 APIGetDrawContext - 0.00 0.00 50368 2518 20 0 0 APISync - 0.00 2.70 1360 68 20 0 0 |-> APIDrawWakeAllThreads - 0.00 65.27 32876 1643 20 0 0 |-> APIGetDrawContext - - - Thread 1 (WORKER) - %Tot %Par Cycles CPE NumEvent CPE2 NumEvent2 Bucket - 83.92 83.92 13198987522 96411 136902 0 0 FEProcessDraw - 24.91 29.69 3918184840 167 23410158 0 0 |-> FEFetchShader - 11.17 13.31 1756972646 75 23410158 0 0 |-> FEVertexShader - 8.89 10.59 1397902996 59 23410161 0 0 |-> FEPAAssemble - 19.06 22.71 2997794710 384 7803387 0 0 |-> FEClipTriangles - 11.67 61.21 1834958176 235 7803387 0 0 |-> FEBinTriangles - 0.00 0.00 0 0 187258 0 0 |-> FECullZeroAreaAndBackface - 0.00 0.00 0 0 60051033 0 0 |-> FECullBetweenCenters - 0.11 0.11 17217556 2869592 6 0 0 FEProcessStoreTiles - 15.97 15.97 2511392576 73665 34092 0 0 WorkerWorkOnFifoBE - 14.04 87.95 2208687340 9187 240408 0 0 |-> WorkerFoundWork - 0.06 0.43 9390536 13263 708 0 0 |-> BELoadTiles - 0.00 0.01 293020 182 1609 0 0 |-> BEClear - 12.63 89.94 1986508990 949 2093014 0 0 |-> BERasterizeTriangle - 2.37 18.75 372374596 177 2093014 0 0 |-> BETriangleSetup - 0.42 3.35 66539016 31 2093014 0 0 |-> BEStepSetup - 0.00 0.00 0 0 21766 0 0 |-> BETrivialReject - 1.05 8.33 165410662 79 2071248 0 0 |-> BERasterizePartial - 6.06 48.02 953847796 1260 756783 0 0 |-> BEPixelBackend - 0.20 3.30 31521202 41 756783 0 0 |-> BESetup - 0.16 2.69 25624304 33 756783 0 0 |-> BEBarycentric - 0.18 2.92 27884986 36 756783 0 0 |-> BEEarlyDepthTest - 0.19 3.20 30564174 41 744058 0 0 |-> BEPixelShader - 0.26 4.30 41058646 55 744058 0 0 |-> BEOutputMerger - 1.27 20.94 199750822 32 6054264 0 0 |-> BEEndTile - 0.33 2.34 51758160 23687 2185 0 0 |-> BEStoreTiles - 0.20 60.22 31169500 28807 1082 0 0 |-> B8G8R8A8_UNORM - 0.00 0.00 302752 302752 1 0 0 WorkerWaitForThreadEvent - diff --git a/docs/drivers/openswr/usage.rst b/docs/drivers/openswr/usage.rst deleted file mode 100644 index 1fb5e04a13b..00000000000 --- a/docs/drivers/openswr/usage.rst +++ /dev/null @@ -1,38 +0,0 @@ -Usage -===== - -Requirements -^^^^^^^^^^^^ - -* An x86 processor with AVX or above -* LLVM version 3.9 or later -* C++14 capable compiler - -Building -^^^^^^^^ - -To build with GNU automake, select building the swr driver at -configure time, for example: :: - - configure --with-gallium-drivers=swrast,swr - -Using -^^^^^ - -On Linux, building with autotools will create a drop-in alternative -for libGL.so into:: - - lib/gallium/libGL.so - lib/gallium/libswrAVX.so - lib/gallium/libswrAVX2.so - -To use it set the LD_LIBRARY_PATH environment variable accordingly. - -**IMPORTANT:** Mesa will default to using llvmpipe or softpipe as the default software renderer. To select the OpenSWR driver, set the GALLIUM_DRIVER environment variable appropriately: :: - - GALLIUM_DRIVER=swr - -To verify OpenSWR is being used, check to see if a message like the following is printed when the application is started: :: - - SWR detected AVX2 - diff --git a/docs/envvars.rst b/docs/envvars.rst index 9a29c168f86..1068f6dd79d 100644 --- a/docs/envvars.rst +++ b/docs/envvars.rst @@ -449,8 +449,7 @@ Gallium environment variables files. :envvar:`GALLIUM_DRIVER` useful in combination with :envvar:`LIBGL_ALWAYS_SOFTWARE`=`true` for - choosing one of the software renderers ``softpipe``, ``llvmpipe`` or - ``swr``. + choosing one of the software renderers ``softpipe`` or ``llvmpipe``. :envvar:`GALLIUM_LOG_FILE` specifies a file for logging all errors, warnings, etc. rather than stderr. diff --git a/docs/features.txt b/docs/features.txt index 9357529e64c..2b4e96b3829 100644 --- a/docs/features.txt +++ b/docs/features.txt @@ -36,7 +36,7 @@ context as extensions. Feature Status ------------------------------------------------------- ------------------------ -GL 3.0, GLSL 1.30 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, swr, virgl, zink, d3d12, panfrost +GL 3.0, GLSL 1.30 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, virgl, zink, d3d12, panfrost glBindFragDataLocation, glGetFragDataLocation DONE GL_NV_conditional_render (Conditional rendering) DONE () @@ -63,13 +63,13 @@ GL 3.0, GLSL 1.30 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llv glVertexAttribI commands DONE Depth format cube textures DONE () GLX_ARB_create_context (GLX 1.4 is required) DONE (v3d, vc4) - Multisample anti-aliasing DONE (freedreno/a5xx+, freedreno (*), llvmpipe (*), softpipe (*), swr (*)) + Multisample anti-aliasing DONE (freedreno/a5xx+, freedreno (*), llvmpipe (*), softpipe (*))) 8 draw buffers DONE (panfrost/t760+) -(*) freedreno (a2xx-a4xx), llvmpipe, softpipe, and swr have fake Multisample anti-aliasing support +(*) freedreno (a2xx-a4xx), llvmpipe, and softpipe have fake Multisample anti-aliasing support -GL 3.1, GLSL 1.40 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, swr, virgl, zink, d3d12, panfrost +GL 3.1, GLSL 1.40 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, virgl, zink, d3d12, panfrost Forward compatible context support/deprecations DONE GL_ARB_draw_instanced (Instanced drawing) DONE (v3d) @@ -82,7 +82,7 @@ GL 3.1, GLSL 1.40 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llv GL_EXT_texture_snorm (Signed normalized textures) DONE (v3d) -GL 3.2, GLSL 1.50 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, swr, virgl, zink, d3d12 +GL 3.2, GLSL 1.50 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, virgl, zink, d3d12 Core/compatibility profiles DONE Geometry shaders DONE (freedreno/a6xx) @@ -99,70 +99,70 @@ GL 3.2, GLSL 1.50 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llv GL 3.3, GLSL 3.30 --- all DONE: freedreno, i965, nv50, nvc0, r600, radeonsi, llvmpipe, softpipe, virgl, zink, d3d12 - GL_ARB_blend_func_extended DONE (freedreno/a3xx, freedreno/a6xx, swr, panfrost, lima) + GL_ARB_blend_func_extended DONE (freedreno/a3xx, freedreno/a6xx, panfrost, lima) GL_ARB_explicit_attrib_location DONE (all drivers that support GLSL) - GL_ARB_occlusion_query2 DONE (swr, v3d, vc4, panfrost, lima) + GL_ARB_occlusion_query2 DONE (v3d, vc4, panfrost, lima) GL_ARB_sampler_objects DONE (all drivers) - GL_ARB_shader_bit_encoding DONE (swr, v3d, panfrost) - GL_ARB_texture_rgb10_a2ui DONE (swr, panfrost) - GL_ARB_texture_swizzle DONE (swr, v3d, vc4, panfrost, lima) - GL_ARB_timer_query DONE (swr) - GL_ARB_instanced_arrays DONE (swr, v3d, panfrost) - GL_ARB_vertex_type_2_10_10_10_rev DONE (swr, v3d, panfrost) + GL_ARB_shader_bit_encoding DONE (v3d, panfrost) + GL_ARB_texture_rgb10_a2ui DONE (panfrost) + GL_ARB_texture_swizzle DONE (v3d, vc4, panfrost, lima) + GL_ARB_timer_query DONE () + GL_ARB_instanced_arrays DONE (v3d, panfrost) + GL_ARB_vertex_type_2_10_10_10_rev DONE (v3d, panfrost) GL 4.0, GLSL 4.00 --- all DONE: i965/gen7+, nvc0, r600, radeonsi, llvmpipe, virgl, zink - GL_ARB_draw_buffers_blend DONE (freedreno, i965/gen6+, nv50, softpipe, swr, panfrost, d3d12) - GL_ARB_draw_indirect DONE (freedreno, i965/gen7+, softpipe, swr, v3d) + GL_ARB_draw_buffers_blend DONE (freedreno, i965/gen6+, nv50, softpipe, panfrost, d3d12) + GL_ARB_draw_indirect DONE (freedreno, i965/gen7+, softpipe, v3d) GL_ARB_gpu_shader5 DONE (i965/gen7+) - 'precise' qualifier DONE (softpipe) - Dynamically uniform sampler array indices DONE (softpipe) - Dynamically uniform UBO array indices DONE (freedreno, softpipe) - - Implicit signed -> unsigned conversions DONE (softpipe, swr) - - Fused multiply-add DONE (softpipe, swr) - - Packing/bitfield/conversion functions DONE (freedreno, softpipe, swr, panfrost) - - Enhanced textureGather DONE (freedreno, softpipe, swr, panfrost) - - Geometry shader instancing DONE (softpipe, swr) - - Geometry shader multiple streams DONE (softpipe, swr) + - Implicit signed -> unsigned conversions DONE (softpipe, ) + - Fused multiply-add DONE (softpipe, ) + - Packing/bitfield/conversion functions DONE (freedreno, softpipe, panfrost) + - Enhanced textureGather DONE (freedreno, softpipe, panfrost) + - Geometry shader instancing DONE (softpipe, ) + - Geometry shader multiple streams DONE (softpipe, ) - Enhanced per-sample shading DONE () - Interpolation functions DONE (softpipe) - New overload resolution rules DONE (softpipe) - GL_ARB_gpu_shader_fp64 DONE (i965/gen7+, softpipe, swr) + GL_ARB_gpu_shader_fp64 DONE (i965/gen7+, softpipe, ) GL_ARB_sample_shading DONE (freedreno/a6xx, i965/gen6+, nv50, panfrost) - GL_ARB_shader_subroutine DONE (freedreno, i965/gen6+, nv50, softpipe, swr, d3d12) - GL_ARB_tessellation_shader DONE (freedreno/a6xx, i965/gen7+, swr) - GL_ARB_texture_buffer_object_rgb32 DONE (freedreno, i965/gen6+, softpipe, swr, d3d12, panfrost) - GL_ARB_texture_cube_map_array DONE (freedreno/a4xx+, i965/gen6+, nv50, softpipe, swr) - GL_ARB_texture_gather DONE (freedreno, i965/gen6+, nv50, softpipe, swr, v3d, panfrost) - GL_ARB_texture_query_lod DONE (freedreno, i965, nv50, softpipe, swr, v3d, panfrost, d3d12) - GL_ARB_transform_feedback2 DONE (freedreno/a3xx+, i965/gen6+, nv50, softpipe, swr, v3d, panfrost) - GL_ARB_transform_feedback3 DONE (freedreno/a3xx+, i965/gen7+, softpipe, swr) + GL_ARB_shader_subroutine DONE (freedreno, i965/gen6+, nv50, softpipe, d3d12) + GL_ARB_tessellation_shader DONE (freedreno/a6xx, i965/gen7+, ) + GL_ARB_texture_buffer_object_rgb32 DONE (freedreno, i965/gen6+, softpipe, d3d12, panfrost) + GL_ARB_texture_cube_map_array DONE (freedreno/a4xx+, i965/gen6+, nv50, softpipe, ) + GL_ARB_texture_gather DONE (freedreno, i965/gen6+, nv50, softpipe, v3d, panfrost) + GL_ARB_texture_query_lod DONE (freedreno, i965, nv50, softpipe, v3d, panfrost, d3d12) + GL_ARB_transform_feedback2 DONE (freedreno/a3xx+, i965/gen6+, nv50, softpipe, v3d, panfrost) + GL_ARB_transform_feedback3 DONE (freedreno/a3xx+, i965/gen7+, softpipe, ) GL 4.1, GLSL 4.10 --- all DONE: i965/gen7+, nvc0, r600, radeonsi, llvmpipe, virgl, zink - GL_ARB_ES2_compatibility DONE (freedreno, i965, nv50, softpipe, swr, v3d, vc4, panfrost, d3d12, lima) + GL_ARB_ES2_compatibility DONE (freedreno, i965, nv50, softpipe, v3d, vc4, panfrost, d3d12, lima) GL_ARB_get_program_binary DONE (freedreno, 0 or 1 binary formats) GL_ARB_separate_shader_objects DONE (all drivers) GL_ARB_shader_precision DONE (i965/gen7+, all drivers that support GLSL 4.10) - GL_ARB_vertex_attrib_64bit DONE (i965/gen7+, softpipe, swr) - GL_ARB_viewport_array DONE (i965, nv50, softpipe, swr) + GL_ARB_vertex_attrib_64bit DONE (i965/gen7+, softpipe, ) + GL_ARB_viewport_array DONE (i965, nv50, softpipe, ) GL 4.2, GLSL 4.20 -- all DONE: i965/gen7+, nvc0, r600, radeonsi, llvmpipe, virgl, zink - GL_ARB_texture_compression_bptc DONE (freedreno, i965, softpipe, swr, panfrost/if SoC supports) + GL_ARB_texture_compression_bptc DONE (freedreno, i965, softpipe, panfrost/if SoC supports) GL_ARB_compressed_texture_pixel_storage DONE (all drivers) GL_ARB_shader_atomic_counters DONE (freedreno/a5xx+, i965, softpipe, v3d, panfrost) GL_ARB_texture_storage DONE (all drivers) - GL_ARB_transform_feedback_instanced DONE (freedreno, i965, nv50, softpipe, swr, v3d) - GL_ARB_base_instance DONE (freedreno, i965, nv50, softpipe, swr, v3d) + GL_ARB_transform_feedback_instanced DONE (freedreno, i965, nv50, softpipe, v3d) + GL_ARB_base_instance DONE (freedreno, i965, nv50, softpipe, v3d) GL_ARB_shader_image_load_store DONE (freedreno/a5xx+, i965, softpipe, v3d, panfrost) GL_ARB_conservative_depth DONE (all drivers that support GLSL 1.30) GL_ARB_shading_language_420pack DONE (all drivers that support GLSL 1.30) GL_ARB_shading_language_packing DONE (all drivers) - GL_ARB_internalformat_query DONE (freedreno, i965, nv50, softpipe, swr, v3d, vc4, panfrost, d3d12, lima) + GL_ARB_internalformat_query DONE (freedreno, i965, nv50, softpipe, v3d, vc4, panfrost, d3d12, lima) GL_ARB_map_buffer_alignment DONE (all drivers) @@ -172,31 +172,31 @@ GL 4.3, GLSL 4.30 -- all DONE: i965/gen8+, nvc0, r600, radeonsi, llvmpipe, virgl GL_ARB_ES3_compatibility DONE (all drivers that support GLSL 3.30) GL_ARB_clear_buffer_object DONE (all drivers) GL_ARB_compute_shader DONE (freedreno/a5xx+, i965, softpipe, v3d, panfrost) - GL_ARB_copy_image DONE (i965, nv50, softpipe, swr) + GL_ARB_copy_image DONE (i965, nv50, softpipe, ) GL_KHR_debug DONE (all drivers) GL_ARB_explicit_uniform_location DONE (all drivers that support GLSL) - GL_ARB_fragment_layer_viewport DONE (i965, nv50, softpipe, swr) + GL_ARB_fragment_layer_viewport DONE (i965, nv50, softpipe, ) GL_ARB_framebuffer_no_attachments DONE (freedreno, i965, softpipe, v3d) GL_ARB_internalformat_query2 DONE (all drivers) GL_ARB_invalidate_subdata DONE (all drivers) - GL_ARB_multi_draw_indirect DONE (freedreno, i965, softpipe, swr, v3d) + GL_ARB_multi_draw_indirect DONE (freedreno, i965, softpipe, v3d) GL_ARB_program_interface_query DONE (all drivers) GL_ARB_robust_buffer_access_behavior DONE (freedreno, i965) GL_ARB_shader_image_size DONE (freedreno/a5xx+, i965, softpipe, v3d, panfrost) GL_ARB_shader_storage_buffer_object DONE (freedreno/a5xx+, i965, softpipe, v3d, panfrost) - GL_ARB_stencil_texturing DONE (freedreno, i965/hsw+, nv50, softpipe, swr, v3d, panfrost, d3d12) - GL_ARB_texture_buffer_range DONE (freedreno, nv50, i965, softpipe, swr, v3d, d3d12) + GL_ARB_stencil_texturing DONE (freedreno, i965/hsw+, nv50, softpipe, v3d, panfrost, d3d12) + GL_ARB_texture_buffer_range DONE (freedreno, nv50, i965, softpipe, v3d, d3d12) GL_ARB_texture_query_levels DONE (all drivers that support GLSL 1.30) GL_ARB_texture_storage_multisample DONE (all drivers that support GL_ARB_texture_multisample) - GL_ARB_texture_view DONE (freedreno, i965, nv50, softpipe, swr, v3d) + GL_ARB_texture_view DONE (freedreno, i965, nv50, softpipe, v3d) GL_ARB_vertex_attrib_binding DONE (all drivers) GL 4.4, GLSL 4.40 -- all DONE: i965/gen8+, nvc0, r600, radeonsi, llvmpipe, zink GL_MAX_VERTEX_ATTRIB_STRIDE DONE (all drivers) - GL_ARB_buffer_storage DONE (freedreno, i965, nv50, swr, v3d, vc4) - GL_ARB_clear_texture DONE (i965, nv50, softpipe, swr, virgl) + GL_ARB_buffer_storage DONE (freedreno, i965, nv50, v3d, vc4) + GL_ARB_clear_texture DONE (i965, nv50, softpipe, virgl) GL_ARB_enhanced_layouts DONE (i965, nv50, softpipe, virgl) - compile-time constant expressions DONE - explicit byte offsets for blocks DONE @@ -206,16 +206,16 @@ GL 4.4, GLSL 4.40 -- all DONE: i965/gen8+, nvc0, r600, radeonsi, llvmpipe, zink - input/output block locations DONE GL_ARB_multi_bind DONE (all drivers) GL_ARB_query_buffer_object DONE (i965/hsw+, virgl) - GL_ARB_texture_mirror_clamp_to_edge DONE (i965, nv50, softpipe, swr, virgl, v3d, panfrost) - GL_ARB_texture_stencil8 DONE (freedreno, i965/hsw+, nv50, softpipe, swr, virgl, v3d, panfrost, d3d12) - GL_ARB_vertex_type_10f_11f_11f_rev DONE (freedreno, i965, nv50, softpipe, swr, virgl, panfrost, d3d12) + GL_ARB_texture_mirror_clamp_to_edge DONE (i965, nv50, softpipe, virgl, v3d, panfrost) + GL_ARB_texture_stencil8 DONE (freedreno, i965/hsw+, nv50, softpipe, virgl, v3d, panfrost, d3d12) + GL_ARB_vertex_type_10f_11f_11f_rev DONE (freedreno, i965, nv50, softpipe, virgl, panfrost, d3d12) GL 4.5, GLSL 4.50 -- all DONE: nvc0, r600, radeonsi, llvmpipe, zink GL_ARB_ES3_1_compatibility DONE (i965/hsw+, softpipe, virgl) - GL_ARB_clip_control DONE (freedreno, i965, nv50, softpipe, swr, virgl, lima) - GL_ARB_conditional_render_inverted DONE (freedreno, i965, nv50, softpipe, swr, virgl, panfrost) - GL_ARB_cull_distance DONE (freedreno/a6xx, i965, nv50, softpipe, swr, virgl) + GL_ARB_clip_control DONE (freedreno, i965, nv50, softpipe, virgl, lima) + GL_ARB_conditional_render_inverted DONE (freedreno, i965, nv50, softpipe, virgl, panfrost) + GL_ARB_cull_distance DONE (freedreno/a6xx, i965, nv50, softpipe, virgl) GL_ARB_derivative_control DONE (i965, nv50, softpipe, virgl) GL_ARB_direct_state_access DONE (all drivers) GL_ARB_get_texture_sub_image DONE (all drivers) @@ -229,8 +229,8 @@ GL 4.6, GLSL 4.60 -- all DONE: radeonsi, zink GL_ARB_gl_spirv DONE (i965/gen7+, llvmpipe) GL_ARB_indirect_parameters DONE (i965/gen7+, nvc0, llvmpipe, virgl) - GL_ARB_pipeline_statistics_query DONE (i965, nvc0, r600, llvmpipe, softpipe, swr) - GL_ARB_polygon_offset_clamp DONE (freedreno, i965, nv50, nvc0, r600, llvmpipe, swr, virgl) + GL_ARB_pipeline_statistics_query DONE (i965, nvc0, r600, llvmpipe, softpipe, ) + GL_ARB_polygon_offset_clamp DONE (freedreno, i965, nv50, nvc0, r600, llvmpipe, virgl) GL_ARB_shader_atomic_counter_ops DONE (freedreno/a5xx+, i965/gen7+, nvc0, r600, llvmpipe, softpipe, virgl, v3d) GL_ARB_shader_draw_parameters DONE (i965, llvmpipe, nvc0) GL_ARB_shader_group_vote DONE (i965, nvc0, llvmpipe) @@ -244,18 +244,18 @@ GLES3.1, GLSL ES 3.1 -- all DONE: i965/hsw+, nvc0, r600, radeonsi, virgl, v3d, s GL_ARB_arrays_of_arrays DONE (all drivers that support GLSL 1.30) GL_ARB_compute_shader DONE (freedreno/a5xx+, i965/gen7+) - GL_ARB_draw_indirect DONE (freedreno, i965/gen7+, swr) + GL_ARB_draw_indirect DONE (freedreno, i965/gen7+, ) GL_ARB_explicit_uniform_location DONE (all drivers that support GLSL) GL_ARB_framebuffer_no_attachments DONE (freedreno, i965/gen7+, softpipe) GL_ARB_program_interface_query DONE (all drivers) - GL_ARB_shader_atomic_counters DONE (freedreno/a5xx+, i965/gen7+, swr) - GL_ARB_shader_image_load_store DONE (freedreno/a5xx+, i965/gen7+, swr) - GL_ARB_shader_image_size DONE (freedreno/a5xx+, i965/gen7+, swr) + GL_ARB_shader_atomic_counters DONE (freedreno/a5xx+, i965/gen7+, ) + GL_ARB_shader_image_load_store DONE (freedreno/a5xx+, i965/gen7+, ) + GL_ARB_shader_image_size DONE (freedreno/a5xx+, i965/gen7+, ) GL_ARB_shader_storage_buffer_object DONE (freedreno/a5xx+, i965/gen7+) GL_ARB_shading_language_packing DONE (all drivers) GL_ARB_separate_shader_objects DONE (all drivers) - GL_ARB_stencil_texturing DONE (freedreno, nv50, swr) - GL_ARB_texture_multisample (Multisample textures) DONE (freedreno/a5xx+, i965/gen7+, nv50, swr) + GL_ARB_stencil_texturing DONE (freedreno, nv50, ) + GL_ARB_texture_multisample (Multisample textures) DONE (freedreno/a5xx+, i965/gen7+, nv50, ) GL_ARB_texture_storage_multisample DONE (all drivers that support GL_ARB_texture_multisample) GL_ARB_vertex_attrib_binding DONE (all drivers) GS5 Enhanced textureGather DONE (freedreno, i965/gen7+) @@ -274,7 +274,7 @@ GLES3.2, GLSL ES 3.2 -- all DONE: i965/gen9+, radeonsi, virgl, llvmpipe, zink GL_KHR_blend_equation_advanced DONE (freedreno/a6xx, i965, nvc0, panfrost) GL_KHR_debug DONE (all drivers) GL_KHR_robustness DONE (freedreno, i965, nvc0, r600) - GL_KHR_texture_compression_astc_ldr DONE (freedreno, i965/gen9+, r600, v3d, vc4, panfrost, softpipe, swr, lima) + GL_KHR_texture_compression_astc_ldr DONE (freedreno, i965/gen9+, r600, v3d, vc4, panfrost, softpipe, lima) GL_OES_copy_image DONE (all drivers) GL_OES_draw_buffers_indexed DONE (all drivers that support GL_ARB_draw_buffers_blend) GL_OES_draw_elements_base_vertex DONE (all drivers) @@ -305,10 +305,10 @@ Khronos, ARB, and OES extensions that are not part of any OpenGL or OpenGL ES ve GL_ARB_post_depth_coverage DONE (i965, nvc0, radeonsi, llvmpipe, zink) GL_ARB_robustness_isolation not started GL_ARB_sample_locations DONE (nvc0, zink) - GL_ARB_seamless_cubemap_per_texture DONE (etnaviv/SEAMLESS_CUBE_MAP, freedreno, i965, nvc0, r600, radeonsi, softpipe, swr, virgl) + GL_ARB_seamless_cubemap_per_texture DONE (etnaviv/SEAMLESS_CUBE_MAP, freedreno, i965, nvc0, r600, radeonsi, softpipe, virgl) GL_ARB_shader_ballot DONE (i965/gen8+, nvc0, radeonsi, zink) GL_ARB_shader_clock DONE (i965/gen7+, nv50, nvc0, r600, radeonsi, virgl, zink) - GL_ARB_shader_stencil_export DONE (i965/gen9+, r600, radeonsi, softpipe, llvmpipe, swr, virgl, panfrost, zink) + GL_ARB_shader_stencil_export DONE (i965/gen9+, r600, radeonsi, softpipe, llvmpipe, virgl, panfrost, zink) GL_ARB_shader_viewport_layer_array DONE (i965/gen6+, nvc0, radeonsi, zink) GL_ARB_shading_language_include DONE GL_ARB_sparse_buffer DONE (radeonsi/CIK+, zink) @@ -317,7 +317,7 @@ Khronos, ARB, and OES extensions that are not part of any OpenGL or OpenGL ES ve GL_ARB_sparse_texture_clamp not started GL_ARB_texture_filter_minmax DONE (nvc0/gm200+, zink) GL_EXT_color_buffer_half_float DONE (freedreno, i965, iris, llvmpipe, nv50, nvc0, radeonsi, zink) - GL_EXT_depth_bounds_test DONE (i965/gen12+, nv50, nvc0, radeonsi, softpipe, swr, zink) + GL_EXT_depth_bounds_test DONE (i965/gen12+, nv50, nvc0, radeonsi, softpipe, zink) GL_EXT_memory_object DONE (radeonsi, i965/gen7+, llvmpipe) GL_EXT_memory_object_fd DONE (radeonsi, i965/gen7+, llvmpipe) GL_EXT_memory_object_win32 not started @@ -332,7 +332,7 @@ Khronos, ARB, and OES extensions that are not part of any OpenGL or OpenGL ES ve GL_EXT_texture_sRGB_R8 DONE (all drivers that support GLES 3.0+) GL_KHR_blend_equation_advanced_coherent DONE (i965/gen9+, panfrost) GL_KHR_texture_compression_astc_hdr DONE (i965/bxt, panfrost) - GL_KHR_texture_compression_astc_sliced_3d DONE (i965/gen9+, r600, radeonsi, panfrost, softpipe, swr, zink, lima) + GL_KHR_texture_compression_astc_sliced_3d DONE (i965/gen9+, r600, radeonsi, panfrost, softpipe, zink, lima) GL_OES_depth_texture_cube_map DONE (all drivers that support GLSL 1.30+) GL_OES_EGL_image DONE (all drivers) GL_OES_EGL_image_external DONE (all drivers) @@ -340,11 +340,11 @@ Khronos, ARB, and OES extensions that are not part of any OpenGL or OpenGL ES ve GL_OES_required_internalformat DONE (all drivers) GL_OES_surfaceless_context DONE (all drivers) GL_OES_texture_compression_astc DONE (core only) - GL_OES_texture_float DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, swr, zink) - GL_OES_texture_float_linear DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, swr, zink) - GL_OES_texture_half_float DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, swr, zink, lima) - GL_OES_texture_half_float_linear DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, swr, zink, lima) - GL_OES_texture_view DONE (freedreno, i965/gen8+, r600, radeonsi, nv50, nvc0, softpipe, llvmpipe, swr, v3d, zink) + GL_OES_texture_float DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, zink) + GL_OES_texture_float_linear DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, zink) + GL_OES_texture_half_float DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, zink, lima) + GL_OES_texture_half_float_linear DONE (freedreno, i965, r300, r600, radeonsi, nv30, nv50, nvc0, softpipe, llvmpipe, panfrost, zink, lima) + GL_OES_texture_view DONE (freedreno, i965/gen8+, r600, radeonsi, nv50, nvc0, softpipe, llvmpipe, v3d, zink) GL_OES_viewport_array DONE (i965, nvc0, r600, radeonsi, softpipe, zink) GLX_ARB_context_flush_control not started GLX_ARB_robustness_application_isolation not started diff --git a/docs/history.rst b/docs/history.rst index 276f2a52f07..3c167f54a4d 100644 --- a/docs/history.rst +++ b/docs/history.rst @@ -88,8 +88,7 @@ Ongoing: Mesa is the OpenGL implementation for devices designed by Intel, AMD, NVIDIA, Qualcomm, Broadcom, Vivante, plus the VMware and VirGL virtual GPUs. There's also several software-based renderers: swrast (the legacy Mesa rasterizer), softpipe (a Gallium reference -driver), llvmpipe (LLVM/JIT-based high-speed rasterizer) and swr -(another LLVM-based driver). +driver) and llvmpipe (LLVM/JIT-based high-speed rasterizer). Work continues on the drivers and core Mesa to implement newer versions of the OpenGL, OpenGL ES and Vulkan specifications. diff --git a/docs/index.rst b/docs/index.rst index 1cad5402dc9..2335981112e 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -87,7 +87,6 @@ Linux, FreeBSD, and other operating systems. drivers/freedreno drivers/lima drivers/llvmpipe - drivers/openswr drivers/panfrost drivers/svga3d drivers/v3d diff --git a/docs/meson.rst b/docs/meson.rst index d19bb94e35a..2baeec81a85 100644 --- a/docs/meson.rst +++ b/docs/meson.rst @@ -296,7 +296,6 @@ The wrap file must define the following: It may also define: - ``irbuilder_h``: a ``files()`` object pointing to llvm/IR/IRBuilder.h - (this is required for SWR) - ``has_rtti``: a ``bool`` that declares whether LLVM was built with RTTI. Defaults to true diff --git a/docs/sourcetree.rst b/docs/sourcetree.rst index 958fe51d7e5..e331232793f 100644 --- a/docs/sourcetree.rst +++ b/docs/sourcetree.rst @@ -121,7 +121,6 @@ each directory. - **radeonsi** - Driver for AMD Southern Island and newer (GCN, RDNA). - **softpipe** - Software reference driver. - **svga** - Driver for VMware's SVGA virtual GPU. - - **swr** - Software driver with massively parellel vertex processing. - **tegra** - Driver for NVIDIA Tegra GPUs. - **v3d** - Driver for Broadcom VideoCore 5 and newer. - **vc4** - Driver for Broadcom VideoCore 4. diff --git a/docs/systems.rst b/docs/systems.rst index dd253511962..dd057409c32 100644 --- a/docs/systems.rst +++ b/docs/systems.rst @@ -42,8 +42,6 @@ Software drivers include: - :doc:`LLVMpipe ` - uses LLVM for x86 JIT code generation and is multi-threaded - Softpipe - a reference Gallium driver -- :doc:`OpenSWR ` - x86-optimized software renderer - for visualization workloads Additional driver information: