{"id":148,"date":"2024-06-18T21:01:39","date_gmt":"2024-06-18T13:01:39","guid":{"rendered":"http:\/\/chenglixue.top\/?p=148"},"modified":"2024-07-03T23:36:51","modified_gmt":"2024-07-03T15:36:51","slug":"unity-group-shared-memory%e5%8a%a0%e9%80%9f%e9%ab%98%e6%96%af%e6%a8%a1%e7%b3%8a","status":"publish","type":"post","link":"http:\/\/chenglixue.top\/?p=148","title":{"rendered":"Unity Group Shared Memory\u52a0\u901f\u9ad8\u65af\u6a21\u7cca"},"content":{"rendered":"<p><div class=\"has-toc have-toc\"><\/div><\/p>\n<h1>\u4e3a\u4ec0\u4e48\u4f7f\u7528Compute Shader\u8ba1\u7b97\u9ad8\u65af\u6a21\u7cca<\/h1>\n<p>\u5728\u8ba1\u7b97\u9ad8\u65af\u6a21\u7cca\u65f6\uff0c\u56e0\u4e3a\u8ba1\u7b97\u5377\u79ef\u7684\u5173\u7cfb\uff0c\u4f1a\u91cd\u590d\u91c7\u6837\u4e0d\u5c11\u50cf\u7d20\uff0c\u6240\u4ee5\u8fd9\u4e00\u671f\u95f4\u6548\u7387\u662f\u5f88\u4f4e\u7684\u3002\u800c\u5728GPU\u4e2d\u6709\u4e2a\u73a9\u610f\u53eb\u505a\u5171\u4eab\u5185\u5b58\uff0c\u7ebf\u7a0b\u8bbf\u95ee\u5171\u4eab\u5185\u5b58\u7684\u6548\u7387\u662f\u8fdc\u8fdc\u9ad8\u4e8e\u91c7\u6837\u8d34\u56fe\u7684\u6548\u7387\u7684\uff0c\u56e0\u6b64\u672c\u6587\u5c06\u4ecb\u7ecd\u5982\u4f55\u5728Compute Shader\u4f7f\u7528Group Shared Memory\u52a0\u901f\u9ad8\u65af\u6a21\u7cca<\/p>\n<h1>\u5b9e\u73b0\u6b65\u9aa4<\/h1>\n<ul>\n<li>\u5b9e\u73b0\u9ad8\u65af\u6a21\u7cca\u7684\u57fa\u672c\u6b65\u9aa4\u8fd9\u91cc\u5c31\u4e0d\u7ec6\u8bf4\u4e86\uff0c\u91cd\u70b9\u4ecb\u7ecd\u5982\u4f55\u52a0\u901f\uff0c\u53ca\u52a0\u901f\u9700\u6ce8\u610f\u7684\u7ec6\u8282<\/p>\n<\/li>\n<li>\n<p>\u867d\u7136Group Shared Memory\u4f1a\u5b58\u50a8\u8d34\u56fe\u4fe1\u606f\uff0c\u4f46\u5b83\u7684\u5927\u5c0f\u662f\u6709\u9650\u7684\uff0c\u56e0\u6b64\u8fd9\u91cc\u9700\u8981\u8003\u8651\u6700\u5927\u7684\u6a21\u7cca\u534a\u5f84\uff08\u56e0\u4e3a\u6a21\u7cca\u534a\u5f84\u8d8a\u5927\uff0c\u9700\u8981\u7684Group Shared 
Memory\u4e5f\u8d8a\u5927\uff09\uff0c\u8fd9\u91cc\u8bbe\u6700\u5927\u6a21\u7cca\u534a\u5f84MAX_RADIUS\u4e3a32<\/p>\n<\/li>\n<li>\n<p>\u5728Compute Shader\u4e2d\u91c7\u6837\uff0c\u53ef\u4ee5\u628a\u6bcf\u4e2a\u7ebf\u7a0b\u7406\u89e3\u4e3ascreen space uv\uff0c\u90a3\u4e48\u5728\u6a21\u7cca\u8fb9\u754c\u65f6\uff0c\u7531\u4e8e\u6a21\u7cca\u534a\u5f84_BlurRadius\u7684\u5f71\u54cd\uff0c\u7ebf\u7a0b\u53ef\u80fd\u4f1a\u8d8a\u754c\u3002\u56e0\u6b64<strong>Group Shared Memory\u5f00\u8f9f\u7684\u5927\u5c0f\u5e94\u662f\u7ebf\u7a0b\u6570 + 2 * _BlurRadius<\/strong><br \/>\n<img decoding=\"async\"   class=\"lazyload\" data-src=\"https:\/\/pic.imgdb.cn\/item\/666be7d5d9c307b7e97ca5fb.png\" src=\"https:\/\/cdn.jsdelivr.net\/gh\/moezx\/cdn@3.0.2\/img\/svg\/loader\/trans.ajax-spinner-preloader.svg\" onerror=\"imgError(this)\"  alt=\"\" \/><\/p >\n<noscript><img decoding=\"async\" src=\"https:\/\/pic.imgdb.cn\/item\/666be7d5d9c307b7e97ca5fb.png\" alt=\"\" \/><\/p><\/noscript>\n<p>\u5728\u5b9e\u73b0\u65f6\u8fd8\u9700\u8981\u6ce8\u610f\u5904\u7406\u8d8a\u754c\u95ee\u9898\uff08\u91c7\u6837\u5b58\u50a8\u7ebf\u7a0b\u7ec4\u5916\u7684\u8d34\u56fe\u4fe1\u606f\uff09\uff0c\u8d8a\u754c\u540e\u91c7\u6837\u60c5\u51b5\u5982\u4e0b\uff1a<br \/>\n<img decoding=\"async\"   class=\"lazyload\" data-src=\"https:\/\/pic.imgdb.cn\/item\/666bee92d9c307b7e98a1147.png\" src=\"https:\/\/cdn.jsdelivr.net\/gh\/moezx\/cdn@3.0.2\/img\/svg\/loader\/trans.ajax-spinner-preloader.svg\" onerror=\"imgError(this)\"  alt=\"\" \/><\/p >\n<noscript><img decoding=\"async\" src=\"https:\/\/pic.imgdb.cn\/item\/666bee92d9c307b7e98a1147.png\" alt=\"\" 
\/><\/p><\/noscript>\n<\/li>\n<li>\n<p>\u4e3a\u4e86\u4f18\u5316\u9ad8\u65af\u6a21\u7cca\uff0c\u5e38\u89c1\u7684\u662f\u5c06\u4e8c\u7ef4\u9ad8\u65af\u6a21\u7cca\u62c6\u5206\u6210\u4e24\u4e2a\u4e00\u7ef4\u7684\uff0c\u6c34\u5e73\u7ad6\u76f4\u7684\u90fd\u6a21\u7cca\u4e00\u6b21\uff1b\u672c\u6587\u5728\u6b64\u57fa\u7840\u4e0a\u8fd8\u901a\u8fc7<strong>\u7ebf\u6027\u63d2\u503c<\/strong>\u7684\u624b\u6bb5\u8fdb\u4e00\u6b65\u4f18\u5316\uff0c\u4ee5\u53ca\u964d\u4f4e\u56fe\u7247\u5206\u8fa8\u7387\u540e\u518d\u6a21\u7cca\uff0c\u6700\u540e\u8fd8\u539f\u5206\u8fa8\u7387\u7684\u65b9\u6cd5<\/p>\n<\/li>\n<\/ul>\n<h1>\u5b9e\u73b0<\/h1>\n<pre><code class=\"line-numbers\">#include \"Packages\/com.unity.render-pipelines.core\/ShaderLibrary\/Common.hlsl\"\n\n#pragma region Kernel\n\n#pragma kernel GaussianBlurHorizontalMain\n#pragma kernel GaussianBlurVerticalMain\n\n#pragma endregion\n\n#pragma region Declaration\n\nfloat _BlurRadius;\nfloat4 _ViewSize;\n\nTexture2D&lt;float4&gt; _InputTex;\nRWTexture2D&lt;float4&gt; _OutputTex;\n\nstatic const float Gaussian17[] =\n{\n    0.00002611081194810,\n    0.00021522769030413,\n    0.00133919168719865,\n    0.00628987509902766,\n    0.02229954363469697,\n    0.05967667338326389,\n    0.12055019394312867,\n    0.18381709484250766,\n    0.21157217927735517,\n    0.18381709484250766,\n    0.12055019394312867,\n    0.05967667338326389,\n    0.02229954363469697,\n    0.00628987509902766,\n    0.00133919168719865,\n    0.00021522769030413,\n    0.00002611081194810,\n};\n\n\/\/ groupshared\u7684\u5927\u5c0f\u6709\u6240\u9650\u5236, \u8fd9\u91cc\u8bbe\u7f6e\u6a21\u7cca\u6838\u534a\u5f84\u4e3a32\n#define MAX_RADIUS 32\n\n\/\/ \u6a21\u7cca\u4f1a\u91c7\u6837\u76ee\u6807\u50cf\u7d20\u70b9\u4e24\u4fa7\u7684\u50cf\u7d20, \u56e0\u6b64groupshared\u4e0d\u4ec5\u4ec5\u9700\u8981\u4fdd\u5b58threads, \u8fd8\u9700\u8981\u4fdd\u5b58\u989d\u5916\u7684\u56fe\u50cf\u6570\u636e\ngroupshared float3 GS_Color[64 + 2 * MAX_RADIUS];\n\n#pragma 
endregion\n\n[numthreads(64,1,1)]\nvoid GaussianBlurHorizontalMain (uint3 groupID : SV_GroupID, uint groupIndex : SV_GroupIndex, uint3 dispatchThreadID : SV_DispatchThreadID)\n{\n    int2 currPos = dispatchThreadID.xy;\n    int2 tempPos = clamp(currPos, 0, _ViewSize.xy - 1);\n    GS_Color[groupIndex + MAX_RADIUS] = _InputTex.Load(uint3(tempPos, 0)).rgb;  \/\/ \u5c06\u6570\u636e\u4ece\u5168\u5c40\u5185\u5b58\uff08GPU\u7684\u4e3b\u5185\u5b58\uff09\u52a0\u8f7d\u5230\u5171\u4eab\u5185\u5b58\u4e2d\n\n    if(groupIndex &lt; MAX_RADIUS)\n    {\n        int2 clampPos = max(tempPos - int2(MAX_RADIUS, 0), 0);\n        GS_Color[groupIndex] = _InputTex.Load(uint3(clampPos, 0)).rgb;\n    }\n    if(groupIndex &gt;= 64 - MAX_RADIUS)\n    {\n        int2 clampPos = min(tempPos + int2(MAX_RADIUS, 0), _ViewSize.xy - 1);\n        GS_Color[groupIndex + 2 * MAX_RADIUS] = _InputTex.Load(uint3(clampPos, 0)).rgb;\n    }\n    GroupMemoryBarrierWithGroupSync();  \/\/ \u7ebf\u7a0b\u540c\u6b65\n\n    float3 blurColor = 0.f;\n    UNITY_UNROLL\n    for(uint i = 0; i &lt; 17; ++i)\n    {\n        float weight = Gaussian17[i];\n\n        float offset = ((float)i - 8) * _BlurRadius * 0.125;\n        int floorOffset = floor(offset);\n        float lerpValue = offset - floorOffset;\n        float3 sampleColorFloor = GS_Color[groupIndex + floorOffset + MAX_RADIUS];\n        float3 sampleColorCeil  = GS_Color[groupIndex + floorOffset + MAX_RADIUS + 1];\n        float3 sampleColor = lerp(sampleColorFloor, sampleColorCeil, lerpValue);\n        blurColor += sampleColor * weight;\n    }\n\n    _OutputTex[dispatchThreadID.xy] = float4(blurColor, 1.f);\n}\n\n[numthreads(1,64,1)]\nvoid GaussianBlurVerticalMain (uint3 groupID : SV_GroupID, uint groupIndex : SV_GroupIndex, uint3 dispatchThreadID : SV_DispatchThreadID)\n{\n    int2 currPos = dispatchThreadID.xy;\n    int2 tempPos = clamp(currPos, 0, _ViewSize.xy - 1);\n    GS_Color[groupIndex + MAX_RADIUS] = _InputTex.Load(uint3(tempPos, 0)).rgb;\n\n    
if(groupIndex &lt; MAX_RADIUS)\n    {\n        int2 clampPos = max(tempPos - uint2(0, MAX_RADIUS), 0);\n        GS_Color[groupIndex] = _InputTex.Load(uint3(clampPos, 0)).rgb;\n    }\n\n    if(groupIndex &gt;= 64 - MAX_RADIUS)\n    {\n        int2 clampPos = min(tempPos + uint2(0, MAX_RADIUS), _ViewSize.xy - 1);\n        GS_Color[groupIndex + 2 * MAX_RADIUS] = _InputTex.Load(uint3(clampPos, 0)).rgb;\n    }\n    GroupMemoryBarrierWithGroupSync();\n\n    float3 blurColor = 0.f;\n    UNITY_UNROLL\n    for(uint i = 0; i &lt; 17; ++i)\n    {\n        float weight = Gaussian17[i];\n\n        float offset = ((float)i - 8) * 0.125f * _BlurRadius;\n        int offsetFloor = floor(offset);\n        float lerpValue = offset - offsetFloor;\n\n        float3 sampleColorFloor = GS_Color[groupIndex + MAX_RADIUS + offsetFloor];\n        float3 sampleColorCeil = GS_Color[groupIndex + MAX_RADIUS + offsetFloor + 1];\n        float3 sampleColor = lerp(sampleColorFloor, sampleColorCeil, lerpValue);\n\n        blurColor += sampleColor * weight;\n    }\n\n    _OutputTex[dispatchThreadID.xy] = float4(blurColor, 1.f);\n}\n<\/code><\/pre>\n<h1>\u540e\u7eed<\/h1>\n<p>\u76ee\u524d\u8fd9\u4e2a\u9ad8\u65af\u6a21\u7cca\u8fd8\u5b58\u5728\u4e00\u5b9a\u95ee\u9898\uff0c\u5b83\u7684\u6743\u91cd\u8303\u56f4\u662f\u56fa\u5b9a\u7684\uff0c\u540e\u7eed\u8fd8\u9700\u8003\u8651\u5982\u4f55\u4f18\u5316\uff0c\u4e0d\u8fc7\u4f1a\u653e\u7f6e\u4e00\u6bb5\u65f6\u95f4\uff0c\u5148\u5199TAA\uff01<\/p>\n<h1>Reference<\/h1>\n<p><a class=\"wp-editor-md-post-content-link\" href=\"https:\/\/www.cnblogs.com\/X-Jun\/p\/12309749.html\" target=\"_blank\"  rel=\"nofollow\" >DirectX11 With Windows SDK--30 \u8ba1\u7b97\u7740\u8272\u5668\uff1a\u9ad8\u65af\u6a21\u7cca\u3001\u7d22\u8d1d\u5c14\u7b97\u5b50<\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u4e3a\u4ec0\u4e48\u4f7f\u7528Compute Shader\u8ba1\u7b97\u9ad8\u65af\u6a21\u7cca 
\u5728\u8ba1\u7b97\u9ad8\u65af\u6a21\u7cca\u65f6\uff0c\u56e0\u4e3a\u8ba1\u7b97\u5377\u79ef\u7684\u5173\u7cfb\uff0c\u4f1a\u91cd\u590d\u91c7\u6837\u4e0d\u5c11\u50cf\u7d20\uff0c\u6240\u4ee5\u8fd9\u4e00\u671f\u95f4\u6548\u7387\u662f\u5f88 &#8230;<\/p>","protected":false},"author":1,"featured_media":24,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[3],"tags":[],"_links":{"self":[{"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/posts\/148"}],"collection":[{"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/chenglixue.top\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=148"}],"version-history":[{"count":2,"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/posts\/148\/revisions"}],"predecessor-version":[{"id":177,"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/posts\/148\/revisions\/177"}],"wp:featuredmedia":[{"embeddable":true,"href":"http:\/\/chenglixue.top\/index.php?rest_route=\/wp\/v2\/media\/24"}],"wp:attachment":[{"href":"http:\/\/chenglixue.top\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=148"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/chenglixue.top\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=148"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/chenglixue.top\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=148"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}