-
Notifications
You must be signed in to change notification settings - Fork 824
/
Copy pathNativePassCompiler.cs
1481 lines (1288 loc) · 74.1 KB
/
NativePassCompiler.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
using System;
using System.Diagnostics;
using System.Collections.Generic;
using Unity.Collections;
using Unity.Collections.LowLevel.Unsafe;
using UnityEngine.Rendering;
namespace UnityEngine.Rendering.RenderGraphModule.NativeRenderPassCompiler
{
internal partial class NativePassCompiler : IDisposable
{
internal struct RenderGraphInputInfo
{
public RenderGraphResourceRegistry m_ResourcesForDebugOnly;
public List<RenderGraphPass> m_RenderPasses;
public string debugName;
public bool disableCulling;
}
internal RenderGraphInputInfo graph;
internal CompilerContextData contextData = null;
internal CompilerContextData defaultContextData;
internal CommandBuffer previousCommandBuffer;
Stack<int> toVisitPassIds;
RenderGraphCompilationCache m_CompilationCache;
internal const int k_EstimatedPassCount = 100;
internal const int k_MaxSubpass = 8; // Needs to match with RenderPassSetup.h
NativeList<AttachmentDescriptor> m_BeginRenderPassAttachments;
public NativePassCompiler(RenderGraphCompilationCache cache)
{
m_CompilationCache = cache;
defaultContextData = new CompilerContextData(k_EstimatedPassCount);
toVisitPassIds = new Stack<int>(k_EstimatedPassCount);
m_BeginRenderPassAttachments = new NativeList<AttachmentDescriptor>(FixedAttachmentArray<AttachmentDescriptor>.MaxAttachments, Allocator.Persistent);
}
// IDisposable implementation
bool m_Disposed;
~NativePassCompiler() => Cleanup();
public void Dispose()
{
Cleanup();
GC.SuppressFinalize(this);
}
void Cleanup()
{
if (!m_Disposed)
{
m_BeginRenderPassAttachments.Dispose();
m_Disposed = true;
}
}
public bool Initialize(RenderGraphResourceRegistry resources, List<RenderGraphPass> renderPasses, bool disableCulling, string debugName, bool useCompilationCaching, int graphHash, int frameIndex)
{
bool cached = false;
if (!useCompilationCaching)
contextData = defaultContextData;
else
cached = m_CompilationCache.GetCompilationCache(graphHash, frameIndex, out contextData);
graph.m_ResourcesForDebugOnly = resources;
graph.m_RenderPasses = renderPasses;
graph.disableCulling = disableCulling;
graph.debugName = debugName;
Clear(clearContextData: !useCompilationCaching);
return cached;
}
public void Compile(RenderGraphResourceRegistry resources)
{
SetupContextData(resources);
BuildGraph();
CullUnusedRenderPasses();
TryMergeNativePasses();
FindResourceUsageRanges();
DetectMemoryLessResources();
PrepareNativeRenderPasses();
}
public void Clear(bool clearContextData)
{
if (clearContextData)
contextData.Clear();
toVisitPassIds.Clear();
}
void SetPassStatesForNativePass(int nativePassId)
{
NativePassData.SetPassStatesForNativePass(contextData, nativePassId);
}
internal enum NativeCompilerProfileId
{
NRPRGComp_PrepareNativePass,
NRPRGComp_SetupContextData,
NRPRGComp_BuildGraph,
NRPRGComp_CullNodes,
NRPRGComp_TryMergeNativePasses,
NRPRGComp_FindResourceUsageRanges,
NRPRGComp_DetectMemorylessResources,
NRPRGComp_ExecuteCreateResources,
NRPRGComp_ExecuteBeginRenderpassCommand,
NRPRGComp_ExecuteDestroyResources,
}
void SetupContextData(RenderGraphResourceRegistry resources)
{
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_SetupContextData)))
{
contextData.Initialize(resources);
}
}
void BuildGraph()
{
var ctx = contextData;
List<RenderGraphPass> passes = graph.m_RenderPasses;
// Not clearing data, we will do it right after in the for loop
// This is to prevent unnecessary costly copies of pass struct (128bytes)
ctx.passData.ResizeUninitialized(passes.Count);
// Build up the context graph and keep track of nodes we encounter that can't be culled
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_BuildGraph)))
{
for (int passId = 0; passId < passes.Count; passId++)
{
var inputPass = passes[passId];
#if DEVELOPMENT_BUILD || UNITY_EDITOR
if (inputPass.type == RenderGraphPassType.Legacy)
{
throw new Exception("Pass '" + inputPass.name + "' is using the legacy rendergraph API." +
" You cannot use legacy passes with the native render pass compiler." +
" Please do not use AddPass on the rendergrpah but use one of the more specific pass types such as AddRasterRenderPass");
}
#endif
// Accessing already existing passData in place in the container through reference to avoid deep copy
// Make sure everything is reset and initialized or we will use obsolete data from previous frame
ref var ctxPass = ref ctx.passData.ElementAt(passId);
ctxPass.ResetAndInitialize(inputPass, passId);
ctx.passNames.Add(new Name(inputPass.name, true));
if (ctxPass.hasSideEffects)
{
toVisitPassIds.Push(passId);
}
// Set up the list of fragment attachments for this pass
// Note: This doesn't set up the resource reader/writer list as the fragment attachments
// will also be in the pass read/write lists accordingly
if (ctxPass.type == RenderGraphPassType.Raster)
{
// Grab offset in context fragment list to begin building the fragment list
ctxPass.firstFragment = ctx.fragmentData.Length;
// Depth attachment is always at index 0
if (inputPass.depthAccess.textureHandle.handle.IsValid())
{
ctxPass.fragmentInfoHasDepth = true;
if (ctx.AddToFragmentList(inputPass.depthAccess, ctxPass.firstFragment, ctxPass.numFragments))
{
ctxPass.AddFragment(inputPass.depthAccess.textureHandle.handle, ctx);
}
}
for (var ci = 0; ci < inputPass.colorBufferMaxIndex + 1; ++ci)
{
// Skip unused color slots
if (!inputPass.colorBufferAccess[ci].textureHandle.handle.IsValid()) continue;
if (ctx.AddToFragmentList(inputPass.colorBufferAccess[ci], ctxPass.firstFragment, ctxPass.numFragments))
{
ctxPass.AddFragment(inputPass.colorBufferAccess[ci].textureHandle.handle, ctx);
}
}
// Grab offset in context fragment list to begin building the fragment input list
ctxPass.firstFragmentInput = ctx.fragmentData.Length;
for (var ci = 0; ci < inputPass.fragmentInputMaxIndex + 1; ++ci)
{
// Skip unused fragment input slots
if (!inputPass.fragmentInputAccess[ci].textureHandle.IsValid()) continue;
var resource = inputPass.fragmentInputAccess[ci].textureHandle;
if (ctx.AddToFragmentList(inputPass.fragmentInputAccess[ci], ctxPass.firstFragmentInput, ctxPass.numFragmentInputs))
{
ctxPass.AddFragmentInput(inputPass.fragmentInputAccess[ci].textureHandle.handle, ctx);
}
}
// Grab offset in context random write list to begin building the per pass random write lists
ctxPass.firstRandomAccessResource = ctx.randomAccessResourceData.Length;
for (var ci = 0; ci < passes[passId].randomAccessResourceMaxIndex + 1; ++ci)
{
ref var uav = ref passes[passId].randomAccessResource[ci];
// Skip unused random write slots
if (!uav.h.IsValid()) continue;
if (ctx.AddToRandomAccessResourceList(uav.h, ci, uav.preserveCounterValue, ctxPass.firstRandomAccessResource, ctxPass.numRandomAccessResources))
{
ctxPass.AddRandomAccessResource();
}
}
// This is suspicious, there are frame buffer fetch inputs but nothing is output. We don't allow this for now.
// In theory you could fb-fetch inputs and write something to a uav and output nothing? This needs to be investigated
// so don't allow it for now.
if (ctxPass.numFragments == 0)
{
Debug.Assert(ctxPass.numFragmentInputs == 0);
}
}
// Set up per resource type read/write lists for this pass
ctxPass.firstInput = ctx.inputData.Length; // Grab offset in context input list
ctxPass.firstOutput = ctx.outputData.Length; // Grab offset in context output list
for (int type = 0; type < (int)RenderGraphResourceType.Count; ++type)
{
var resourceWrite = inputPass.resourceWriteLists[type];
var resourceWriteCount = resourceWrite.Count;
for (var i = 0; i < resourceWriteCount; ++i)
{
var resource = resourceWrite[i];
// Writing to an imported resource is a side effect so mark the pass if needed
ref var resData = ref ctx.UnversionedResourceData(resource);
if (resData.isImported)
{
if (ctxPass.hasSideEffects == false)
{
ctxPass.hasSideEffects = true;
toVisitPassIds.Push(passId);
}
}
// Mark this pass as writing to this version of the resource
ctx.resources[resource].SetWritingPass(ctx, resource, passId);
ctx.outputData.Add(new PassOutputData
{
resource = resource,
});
ctxPass.numOutputs++;
}
var resourceRead = inputPass.resourceReadLists[type];
var resourceReadCount = resourceRead.Count;
for (var i = 0; i < resourceReadCount; ++i)
{
var resource = resourceRead[i];
// Mark this pass as reading from this version of the resource
ctx.resources[resource].RegisterReadingPass(ctx, resource, passId, ctxPass.numInputs);
ctx.inputData.Add(new PassInputData
{
resource = resource,
});
ctxPass.numInputs++;
}
var resourceTrans = inputPass.transientResourceList[type];
var resourceTransCount = resourceTrans.Count;
for (var i = 0; i < resourceTransCount; ++i)
{
var resource = resourceTrans[i];
// Mark this pass as reading from this version of the resource
ctx.resources[resource].RegisterReadingPass(ctx, resource, passId, ctxPass.numInputs);
ctx.inputData.Add(new PassInputData
{
resource = resource,
});
ctxPass.numInputs++;
// Mark this pass as writing to this version of the resource
ctx.resources[resource].SetWritingPass(ctx, resource, passId);
ctx.outputData.Add(new PassOutputData
{
resource = resource,
});
ctxPass.numOutputs++;
}
}
}
}
}
void CullUnusedRenderPasses()
{
var ctx = contextData;
// Source = input of the graph and starting point that takes no inputs itself : e.g. z-prepass
// Sink = output of the graph and end point e.g. rendered frame
// Usually sinks will have to be pinned or write to an external resource or the whole graph would get culled :-)
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_CullNodes)))
{
// No need to go further if we don't enable culling
if (graph.disableCulling)
return;
// Cull all passes first
ctx.CullAllPasses(true);
// Flood fill downstream algorithm using BFS,
// starting from the pinned nodes to all their dependencies
while (toVisitPassIds.Count != 0)
{
int passId = toVisitPassIds.Pop();
ref var passData = ref ctx.passData.ElementAt(passId);
// We already found this node through another dependency chain
if (!passData.culled) continue;
// Flow upstream from this node
foreach (ref readonly var input in passData.Inputs(ctx))
{
int inputPassIndex = ctx.resources[input.resource].writePassId;
toVisitPassIds.Push(inputPassIndex);
}
// We need this node, don't cull it
passData.culled = false;
}
// Update graph based on freshly culled nodes, remove any connection to them
var numPasses = ctx.passData.Length;
for (int passIndex = 0; passIndex < numPasses; passIndex++)
{
ref readonly var pass = ref ctx.passData.ElementAt(passIndex);
// Remove the connections from the list so they won't be visited again
if (pass.culled)
{
foreach (ref readonly var input in pass.Inputs(ctx))
{
var inputResource = input.resource;
ctx.resources[inputResource].RemoveReadingPass(ctx, inputResource, pass.passId);
}
}
}
}
}
void TryMergeNativePasses()
{
var ctx = contextData;
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_TryMergeNativePasses)))
{
// Try to merge raster passes into the currently active native pass. This will not do pass reordering yet
// so it is simply greedy trying to add the next pass to a currently active one.
// In the future we want to try adding any available (i.e. that has no data dependencies on any future results) future pass
// and allow merging that into the pass thus greedily reordering passes. But reordering requires a lot of API validation
// that ensures rendering behaves accordingly with reordered passes so we don't allow that for now.
// !!! Compilation caching warning !!!
// Merging of passes is highly dependent on render texture properties.
// When caching the render graph compilation, we hash a subset of those render texture properties to make sure we recompile the graph if needed.
// We only hash a subset for performance reason so if you add logic here that will change the behavior of pass merging,
// make sure that the relevant properties are hashed properly. See RenderGraphPass.ComputeHash()
int activeNativePassId = -1;
for (var passIdx = 0; passIdx < ctx.passData.Length; ++passIdx)
{
ref var passToAdd = ref ctx.passData.ElementAt(passIdx);
// If the pass has been culled, just ignore it
if (passToAdd.culled)
{
continue;
}
// If no active pass, there is nothing to merge...
if (activeNativePassId == -1)
{
//If raster, start a new native pass with the current pass
if (passToAdd.type == RenderGraphPassType.Raster)
{
// Allocate a stand-alone native renderpass based on the current pass
ctx.nativePassData.Add(new NativePassData(ref passToAdd, ctx));
passToAdd.nativePassIndex = ctx.nativePassData.LastIndex();
activeNativePassId = passToAdd.nativePassIndex;
}
}
// There is an native pass currently open, try to add the current graph pass to it
else
{
var mergeTestResult = NativePassData.TryMerge(contextData, activeNativePassId, passIdx);
// Merge failed, close current native render pass and create a new one
if (mergeTestResult.reason != PassBreakReason.Merged)
{
SetPassStatesForNativePass(activeNativePassId);
#if UNITY_EDITOR
ref var nativePassData = ref contextData.nativePassData.ElementAt(activeNativePassId);
nativePassData.breakAudit = mergeTestResult;
#endif
if (mergeTestResult.reason == PassBreakReason.NonRasterPass)
{
// Non-raster pass, no active native pass at all
activeNativePassId = -1;
}
else
{
// Raster but cannot be merged, allocate a new stand-alone native renderpass based on the current pass
ctx.nativePassData.Add(new NativePassData(ref passToAdd, ctx));
passToAdd.nativePassIndex = ctx.nativePassData.LastIndex();
activeNativePassId = passToAdd.nativePassIndex;
}
}
}
}
if (activeNativePassId >= 0)
{
// "Close" the last native pass by marking the last graph pass as end
SetPassStatesForNativePass(activeNativePassId);
#if UNITY_EDITOR
ref var nativePassData = ref contextData.nativePassData.ElementAt(activeNativePassId);
nativePassData.breakAudit = new PassBreakAudit(PassBreakReason.EndOfGraph, -1);
#endif
}
}
}
void FindResourceUsageRanges()
{
var ctx = contextData;
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_FindResourceUsageRanges)))
{
// Find the passes that last use a resource
// First do a forward-pass increasing the refcount
// followed by another forward-pass decreasing it again (-> if we get 0, we must be the last ones using it)
// TODO: I have a feeling this can be done more optimally by walking the graph instead of looping over all the passes twice
// to be investigated
// It also won't work if we start reordering passes.
for (int passIndex = 0; passIndex < ctx.passData.Length; passIndex++)
{
ref var pass = ref ctx.passData.ElementAt(passIndex);
if (pass.culled)
continue;
// Loop over all the resources this pass needs (=inputs)
foreach (ref readonly var input in pass.Inputs(ctx))
{
var inputResource = input.resource;
ref var pointTo = ref ctx.UnversionedResourceData(inputResource);
pointTo.lastUsePassID = -1;
// If we use version 0 and nobody else is using it yet,
// mark this pass as the first using the resource.
// It can happen that two passes use v0, e.g.:
// pass1.UseTex(v0,Read) -> this will clear the pass but keep it at v0
// pass2.UseTex(v0,Read) -> "reads" v0
if (inputResource.version == 0)
{
if (pointTo.firstUsePassID < 0)
{
pointTo.firstUsePassID = pass.passId;
pass.AddFirstUse(inputResource, ctx);
}
}
// This pass uses the last version of a resource increase the ref count of this resource
var last = pointTo.latestVersionNumber;
if (last == inputResource.version)
{
pointTo.tag++; //Refcount of how many passes are using the last version of a resource
}
}
//Also look at outputs (but with version 1) for edge case were we do a Write (but no read) to a texture and the pass is manually excluded from culling
//As it isn't read it won't be in the inputs array with V0
foreach (ref readonly var output in pass.Outputs(ctx))
{
var outputResource = output.resource;
ref var pointTo = ref ctx.UnversionedResourceData(outputResource);
if (outputResource.version == 1)
{
// If we use version 0 and nobody else is using it yet,
// Mark this pass as the first using the resource.
// It can happen that two passes use v0, e.g.:
// pass1.UseTex(v0,Read) -> this will clear the pass but keep it at v0
// pass3.UseTex(v0,Read/Write) -> wites v0, brings it to v1 from here on
if (pointTo.firstUsePassID < 0)
{
pointTo.firstUsePassID = pass.passId;
pass.AddFirstUse(outputResource, ctx);
}
}
// This pass outputs the last version of a resource track that
var last = pointTo.latestVersionNumber;
if (last == outputResource.version)
{
Debug.Assert(pointTo.lastWritePassID == -1); // Only one can be the last writer
pointTo.lastWritePassID = pass.passId;
}
}
}
for (int passIndex = 0; passIndex < ctx.passData.Length; passIndex++)
{
ref var pass = ref ctx.passData.ElementAt(passIndex);
if (pass.culled)
continue;
pass.waitOnGraphicsFencePassId = -1;
pass.insertGraphicsFence = false;
foreach (ref readonly var input in pass.Inputs(ctx))
{
var inputResource = input.resource;
ref var pointTo = ref ctx.UnversionedResourceData(inputResource);
var last = pointTo.latestVersionNumber;
if (last == inputResource.version)
{
var refC = pointTo.tag - 1;//Decrease refcount this pass is done using it
if (refC == 0)// We're the last pass done using it, this pass should destroy it.
{
pointTo.lastUsePassID = pass.passId;
pass.AddLastUse(inputResource, ctx);
}
pointTo.tag = refC;
}
// Resolve if this pass needs to wait on a fence due to its inputs
if (pass.waitOnGraphicsFencePassId == -1)
{
ref var pointToVer = ref ctx.VersionedResourceData(inputResource);
ref var wPass = ref ctx.passData.ElementAt(pointToVer.writePassId);
if (wPass.asyncCompute != pass.asyncCompute)
{
pass.waitOnGraphicsFencePassId = wPass.passId;
}
}
}
// We're outputting a resource that is never used.
// This can happen if this pass has multiple outputs and only a portion of them are used
// as some are used, the whole pass is not culled but the unused output still should be freed
foreach (ref readonly var output in pass.Outputs(ctx))
{
var outputResource = output.resource;
ref var pointTo = ref ctx.UnversionedResourceData(outputResource);
ref var pointToVer = ref ctx.VersionedResourceData(outputResource);
var last = pointTo.latestVersionNumber;
if (last == outputResource.version && pointToVer.numReaders == 0)
{
pointTo.lastUsePassID = pass.passId;
pass.AddLastUse(outputResource, ctx);
}
// Resolve if this pass should insert a fence for its outputs
var numReaders = pointToVer.numReaders;
for (var i = 0; i < numReaders; ++i)
{
var depIdx = ctx.resources.IndexReader(outputResource, i);
ref var dep = ref ctx.resources.readerData[outputResource.iType].ElementAt(depIdx);
ref var depPass = ref ctx.passData.ElementAt(dep.passId);
if (pass.asyncCompute != depPass.asyncCompute)
{
pass.insertGraphicsFence = true;
break;
}
}
}
}
}
}
void PrepareNativeRenderPasses()
{
// Prepare all native render pass execution info:
for (var passIdx = 0; passIdx < contextData.nativePassData.Length; ++passIdx)
{
ref var nativePassData = ref contextData.nativePassData.ElementAt(passIdx);
DetermineLoadStoreActions(ref nativePassData);
}
}
static bool IsGlobalTextureInPass(RenderGraphPass pass, ResourceHandle handle)
{
foreach (var g in pass.setGlobalsList)
{
if (g.Item1.handle.index == handle.index)
{
return true;
}
}
return false;
}
void DetectMemoryLessResources()
{
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_DetectMemorylessResources)))
{
// Native renderpasses and create/destroy lists have now been set-up. Detect memoryless resources, i.e resources that are created/destroyed
// within the scope of an nrp
foreach (ref readonly var nativePass in contextData.NativePasses)
{
// Loop over all created resources by this nrp
var graphPasses = nativePass.GraphPasses(contextData);
foreach (ref readonly var subPass in graphPasses)
{
foreach (ref readonly var createdRes in subPass.FirstUsedResources(contextData))
{
ref var createInfo = ref contextData.UnversionedResourceData(createdRes);
if (createdRes.type == RenderGraphResourceType.Texture && createInfo.isImported == false)
{
bool isGlobal = IsGlobalTextureInPass(graph.m_RenderPasses[subPass.passId], createdRes);
// Note: You could think but what if the texture is used as a regular non-frambuffer attachment texture
// surely it can't be memoryless then?
// That is true, but it can never happen as the fact these passes got merged means the textures cannot be used
// as regular textures halfway through a pass. If that were the case they would never have been merged in the first place.
// Except! If the pass consists of a single pass, in that case a texture could be allocated and freed within the single pass
// This is a somewhat degenerate case (e.g. a pass with culling forced off doing a uav write that is never used anywhere)
// But to avoid execution errors we still need to create the resource in this case.
// Check if it is in the destroy list of any of the subpasses > if yes > memoryless
foreach (ref readonly var subPass2 in graphPasses)
{
foreach (ref readonly var destroyedRes in subPass2.LastUsedResources(contextData))
{
ref var destInfo = ref contextData.UnversionedResourceData(destroyedRes);
if (destroyedRes.type == RenderGraphResourceType.Texture && destInfo.isImported == false)
{
if (createdRes.index == destroyedRes.index && !isGlobal)
{
// If a single pass in the native pass we need to check fragment attachment otherwise we're good
// we could always check this in theory but it's an optimization not to check it.
if (nativePass.numNativeSubPasses > 1 || subPass2.IsUsedAsFragment(createdRes, contextData))
{
createInfo.memoryLess = true;
destInfo.memoryLess = true;
}
}
}
}
}
}
}
}
}
}
}
internal static bool IsSameNativeSubPass(ref SubPassDescriptor a, ref SubPassDescriptor b)
{
if (a.flags != b.flags
|| a.colorOutputs.Length != b.colorOutputs.Length
|| a.inputs.Length != b.inputs.Length)
{
return false;
}
for (int i = 0; i < a.colorOutputs.Length; i++)
{
if (a.colorOutputs[i] != b.colorOutputs[i])
{
return false;
}
}
for (int i = 0; i < a.inputs.Length; i++)
{
if (a.inputs[i] != b.inputs[i])
{
return false;
}
}
return true;
}
private void ExecuteCreateRessource(InternalRenderGraphContext rgContext, RenderGraphResourceRegistry resources, in PassData pass)
{
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_ExecuteCreateResources)))
{
resources.forceManualClearOfResource = true;
// For raster passes we need to create resources for all the subpasses at the beginning of the native renderpass
if (pass.type == RenderGraphPassType.Raster && pass.nativePassIndex >= 0)
{
if (pass.mergeState == PassMergeState.Begin || pass.mergeState == PassMergeState.None)
{
ref var nativePass = ref contextData.nativePassData.ElementAt(pass.nativePassIndex);
foreach (ref readonly var subPass in nativePass.GraphPasses(contextData))
{
foreach (ref readonly var res in subPass.FirstUsedResources(contextData))
{
ref readonly var resInfo = ref contextData.UnversionedResourceData(res);
if (resInfo.isImported == false && resInfo.memoryLess == false)
{
bool usedAsFragmentThisPass = subPass.IsUsedAsFragment(res, contextData);
// This resource is read for the first time as a regular texture and not as a framebuffer attachment
// so we need to explicitly clear it, as loadAction.clear only works on framebuffer attachments
// TODO: Should this be a performance warning?? Maybe rare enough in practice?
resources.forceManualClearOfResource = !usedAsFragmentThisPass;
resources.CreatePooledResource(rgContext, res.iType, res.index);
}
}
}
}
}
// Other passes just create them at the beginning of the individual pass
else
{
foreach (ref readonly var create in pass.FirstUsedResources(contextData))
{
ref readonly var pointTo = ref contextData.UnversionedResourceData(create);
if (pointTo.isImported == false)
{
resources.CreatePooledResource(rgContext, create.iType, create.index);
}
}
}
resources.forceManualClearOfResource = true;
}
}
void DetermineLoadStoreActions(ref NativePassData nativePass)
{
using (new ProfilingScope(ProfilingSampler.Get(NativeCompilerProfileId.NRPRGComp_PrepareNativePass)))
{
ref readonly var firstGraphPass = ref contextData.passData.ElementAt(nativePass.firstGraphPass);
ref readonly var lastGraphPass = ref contextData.passData.ElementAt(nativePass.lastGraphPass);
// Some passes don't do any rendering only state changes so just skip them
// If these passes trigger any drawing the raster command buffer will warn users no render targets are set-up for their rendering
if (nativePass.fragments.size <= 0)
{
return;
}
// Some sanity checks, these should not happen
Debug.Assert(firstGraphPass.mergeState == PassMergeState.Begin || firstGraphPass.mergeState == PassMergeState.None);
Debug.Assert(lastGraphPass.mergeState == PassMergeState.End || lastGraphPass.mergeState == PassMergeState.None);
ref readonly var fragmentList = ref nativePass.fragments;
// determine load store actions
// This pass also contains the latest versions used within this pass
// As we have no pass reordering for now the merged passes are always a consecutive list and we can simply do a range
// check on the create/destroy passid to see if it's allocated/freed in this native renderpass
for (int fragmentId = 0; fragmentId < fragmentList.size; ++fragmentId)
{
ref readonly var fragment = ref fragmentList[fragmentId];
int idx = nativePass.attachments.Add(new NativePassAttachment());
ref var currAttachment = ref nativePass.attachments[idx];
#if UNITY_EDITOR
nativePass.loadAudit.Add(new LoadAudit(LoadReason.FullyRewritten));
ref var currLoadAudit = ref nativePass.loadAudit[idx];
nativePass.storeAudit.Add(new StoreAudit(StoreReason.DiscardUnused));
ref var currStoreAudit = ref nativePass.storeAudit[idx];
#endif
currAttachment.handle = fragment.resource;
currAttachment.mipLevel = fragment.mipLevel;
currAttachment.depthSlice = fragment.depthSlice;
// Don't care by default
currAttachment.loadAction = UnityEngine.Rendering.RenderBufferLoadAction.DontCare;
currAttachment.storeAction = UnityEngine.Rendering.RenderBufferStoreAction.DontCare;
// Writing by-default has to preserve the contents, think rendering only a few small triangles on top of a big framebuffer
// So it means we need to load/clear contents potentially.
// If a user pass knows it will write all pixels in a buffer (like a blit) it can use the WriteAll/Discard usage to indicate this to the graph
bool partialWrite = fragment.accessFlags.HasFlag(AccessFlags.Write) && !fragment.accessFlags.HasFlag(AccessFlags.Discard);
ref readonly var resourceData = ref contextData.UnversionedResourceData(fragment.resource);
bool isImported = resourceData.isImported;
int destroyPassID = resourceData.lastUsePassID;
bool usedAfterThisNativePass = (destroyPassID >= (nativePass.lastGraphPass + 1));
if (fragment.accessFlags.HasFlag(AccessFlags.Read) || partialWrite)
{
// The resource is already allocated before this pass so we need to load it
if (resourceData.firstUsePassID < nativePass.firstGraphPass)
{
currAttachment.loadAction = UnityEngine.Rendering.RenderBufferLoadAction.Load;
#if UNITY_EDITOR
currLoadAudit = new LoadAudit(LoadReason.LoadPreviouslyWritten, resourceData.firstUsePassID);
#endif
// Once we decide to load a resource, we must default to the Store action if the resource is used after the current native pass.
// If we were to use the DontCare action in this case, the driver would be effectively be allowed to discard the
// contents of the resource. This is true even when we're only performing reads on it.
if (usedAfterThisNativePass)
{
currAttachment.storeAction = RenderBufferStoreAction.Store;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(StoreReason.StoreUsedByLaterPass, destroyPassID);
#endif
}
}
// It's first used this native pass so we need to clear it so reads/partial writes return the correct clear value
// the clear colors are part of the resource description and set-up when executing the graph we don't need to care about that here.
else
{
if (isImported)
{
// Check if the user indicated he wanted clearing of his imported resource on it's first use by the graph
if (resourceData.clear)
{
currAttachment.loadAction = UnityEngine.Rendering.RenderBufferLoadAction.Clear;
#if UNITY_EDITOR
currLoadAudit = new LoadAudit(LoadReason.ClearImported);
#endif
}
else
{
currAttachment.loadAction = UnityEngine.Rendering.RenderBufferLoadAction.Load;
#if UNITY_EDITOR
currLoadAudit = new LoadAudit(LoadReason.LoadImported);
#endif
}
}
else
{
// Created by the graph internally clear on first read
currAttachment.loadAction = UnityEngine.Rendering.RenderBufferLoadAction.Clear;
#if UNITY_EDITOR
currLoadAudit = new LoadAudit(LoadReason.ClearCreated);
#endif
}
}
}
if (fragment.accessFlags.HasFlag(AccessFlags.Write))
{
// Simple non-msaa case
if (nativePass.samples <= 1)
{
if (usedAfterThisNativePass)
{
// The resource is still used after this native pass so we need to store it.
currAttachment.storeAction = RenderBufferStoreAction.Store;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(StoreReason.StoreUsedByLaterPass, destroyPassID);
#endif
}
else
{
// This is the last native pass that uses the resource.
// If it's imported, we store it because its contents may be used outside the graph.
// Otherwise, we can safely discard its contents.
//
// The one exception to this, is the user declared discard flag which allows us to assume an imported
// resource is not used outside the graph.
if (isImported)
{
if (resourceData.discard)
{
currAttachment.storeAction = RenderBufferStoreAction.DontCare;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(StoreReason.DiscardImported);
#endif
}
else
{
currAttachment.storeAction = RenderBufferStoreAction.Store;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(StoreReason.StoreImported);
#endif
}
}
else
{
currAttachment.storeAction = RenderBufferStoreAction.DontCare;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(StoreReason.DiscardUnused);
#endif
}
}
}
// Complex msaa case
else
{
// The resource is still used after this native pass so we need to store it.
// as we don't know what happens with them and assume the contents are somewhow used outside the graph
// With MSAA we may access the resolved data for longer than the MSAA data so we track the destroyPass and lastPassThatNeedsUnresolved separately
// In theory the opposite could also be true (use MSAA after resolve data is no longer needed) but we consider it sufficiently strange to not
// consider it here.
currAttachment.storeAction = RenderBufferStoreAction.DontCare;
//Check if we're the last pass writing it by checking the output version of the current pass is the higherst version the resource will reach
bool lastWriter = (resourceData.latestVersionNumber == fragment.resource.version); // Cheaper but same? = resourceData.lastWritePassID >= pass.firstGraphPass && resourceData.lastWritePassID < pass.firstGraphPass + pass.numSubPasses;
bool isImportedLastWriter = isImported && lastWriter;
// Used outside this native render pass, we need to store something
if (destroyPassID >= nativePass.firstGraphPass + nativePass.numGraphPasses)
{
// Assume nothing is needed unless we are an imported texture (which doesn't require discarding) and we're the last ones writing it
bool needsMSAASamples = isImportedLastWriter && !resourceData.discard;
bool needsResolvedData = isImportedLastWriter && (resourceData.bindMS == false);//bindMS never resolves
int userPassID = 0;
int msaaUserPassID = 0;
// Check if we need msaa/resolved data by checking all the passes using this buffer
// Partial writes will register themselves as readers so this should be adequate
foreach (ref readonly var reader in contextData.Readers(fragment.resource))
{
ref var readerPass = ref contextData.passData.ElementAt(reader.passId);
bool isFragment = readerPass.IsUsedAsFragment(fragment.resource, contextData);
// Unsafe pass - we cannot know how it is used, so we need to both store and resolve
if (readerPass.type == RenderGraphPassType.Unsafe)
{
needsMSAASamples = true;
needsResolvedData = !resourceData.bindMS;
msaaUserPassID = reader.passId;
userPassID = reader.passId;
break;
}
// A fragment attachment use we need the msaa samples
else if (isFragment)
{
needsMSAASamples = true;
msaaUserPassID = reader.passId;
}
else
{
// Used as a multisample-texture we need the msaa samples
if (resourceData.bindMS)
{
needsMSAASamples = true;
msaaUserPassID = reader.passId;
}
// Used as a regular non-multisample texture we need resolved data
else
{
needsResolvedData = true;
userPassID = reader.passId;
}
}
}
if (needsMSAASamples && needsResolvedData)
{
currAttachment.storeAction = RenderBufferStoreAction.StoreAndResolve;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit(
(isImportedLastWriter) ? StoreReason.StoreImported : StoreReason.StoreUsedByLaterPass, userPassID,
(isImportedLastWriter) ? StoreReason.StoreImported : StoreReason.StoreUsedByLaterPass, msaaUserPassID);
#endif
}
else if (needsResolvedData)
{
currAttachment.storeAction = RenderBufferStoreAction.Resolve;
#if UNITY_EDITOR
currStoreAudit = new StoreAudit((isImportedLastWriter) ? StoreReason.StoreImported : StoreReason.StoreUsedByLaterPass, userPassID, StoreReason.DiscardUnused);