aaa

2024-05-06 09:58:27 +10:00
parent 52baa303dc
commit dba69f9470
14 changed files with 172 additions and 35 deletions
--- a/src/main/resources/assets/voxy/shaders/heriacial_selector/hierarchical_worker.comp
+++ b/src/main/resources/assets/voxy/shaders/heriacial_selector/hierarchical_worker.comp
@@ -0,0 +1,32 @@
+#version 460
+
+layout(local_size_x=8)
+
+
+
+
+//NEW IDEAm use the depth buffer directly to compute the lod level needed to cover it
+
+
+
+
+//Location in world space up to 2x2x2 block size resolution
+#define OctNodeTask uint64_t
+
+
+
+//First 32 bits are the start of child
+// next 16 bits are split into 8 pairs, each pair specifies the type of the subnode (air/empty, partial, full)
+
+
+
+//Tasks are of size uint64_t
+
+
+
+void main() {
+    while (true) {
+        barrier();
+
+    }
+}
--- a/src/main/resources/assets/voxy/shaders/heriacial_selector/persistent_threads.comp
+++ b/src/main/resources/assets/voxy/shaders/heriacial_selector/persistent_threads.comp
@@ -0,0 +1,37 @@
+#version 460
+
+#define WAVE_SIZE 64
+layout(local_size_x=WAVE_SIZE)
+
+#define WorkTask
+
+
+//or make the shape 4x2x4 which has a local size of 32
+
+
+//The work queue is a circular queue with collision detection and abortion
+struct WorkQueueHeader {
+    uint queueSizeBits;
+    uint start;
+    uint end;
+    uint _padd;
+};
+
+
+//Task is a uint32,
+
+//The idea is to use persistent threads + octree culling to recursivly find bottom level sections that satisfy a pixel density requirement
+// given a matrix
+void main() {
+    while (true) {
+
+    }
+}
+
+
+
+//Idea cull/recuse in a manor of 4x4x4 cube (64 bits), have an existance mask per section so that unnessasery computation isnt done on air subsections
+// if a section is fully or partially visible and its aabb does not occupy 1 pixel (or a subset of some specified area/density)
+// then enqueue that section as a job
+// once a node has reached its tail ending, check if its loaded or not, if not, request it to be loaded
+// note that the cpu side can discard sections if they are superceeded by a higher level lod load request etc
--- a/src/main/resources/assets/voxy/shaders/heriacial_selector/traversal.comp
+++ b/src/main/resources/assets/voxy/shaders/heriacial_selector/traversal.comp
@@ -0,0 +1,24 @@
+#version 460
+
+layout(local_size_x=32)
+
+//Works in multiple parts
+// first is a downwards traversal from a base level that finds all the bottom level pixel detail AABBs
+// task queue is firstly filled with large visible AABB's from rastered occlusion
+//
+// each node metadata contains the position in 3d space relative to the toplevel node
+// an offset into the datapool for the child nodes, and union between (a bitmsk of if a child node is full, empty, or mixed (or unloaded))
+//  and a pointer to render metadata for meshlets
+
+
+//The overarching idea is to have meshlets be automatatically selected based on the resulting pixel size/density
+// after 3d projection, we dont want subpixel triangles and we want to be able to automatically account for the
+// perspective warp on the edges of the screen (e.g. high fov == higher density at the center of the screen)
+// from this, the gpu can then (if they are not present) request meshlets be added and thereby automatic lod selection
+// and dynamic building resulting in possibly O(fast) rendering
+void main() {
+    while (true) {
+        barrier();
+
+    }
+}
--- a/src/main/resources/assets/voxy/shaders/lod/gl46mesh/meshlet.glsl
+++ b/src/main/resources/assets/voxy/shaders/lod/gl46mesh/meshlet.glsl
@@ -17,7 +17,7 @@ uint extractDetail(PosHeader pos64) {
    return uint(pos64>>60);
 }
 uvec3 extractMin(AABBHeader aabb) {
-    return uvec3(uint(aabb&0xFF),uint((aabb>>8)&0xFF),uint((aabb>>16)&0xFF));
+    return uvec3(uint(uint(aabb)&0xFF),uint((uint(aabb)>>8)&0xFF),uint((uint(aabb)>>16)&0xFF));
 }
 uvec3 extractMax(AABBHeader aabb) {
    return uvec3(uint((aabb>>24)&0xFF),uint((aabb>>32)&0xFF),uint((aabb>>40)&0xFF));
--- a/src/main/resources/assets/voxy/shaders/lod/gl46mesh/meshletculler.comp
+++ b/src/main/resources/assets/voxy/shaders/lod/gl46mesh/meshletculler.comp
@@ -16,14 +16,18 @@ vec3 proj(vec3 pos) {
 bool testHiZ(PosHeader secPos, AABBHeader aabb) {
    ivec3 section = extractPosition(secPos);
    uint detail = extractDetail(secPos);
-    ivec3 pos = (((section<<detail)-baseSectionPos)<<5);
-    uvec3 cmin = extractMin(aabb)*(1<<detail);
-    uvec3 cmax = extractMax(aabb)*(1<<detail);
+    vec3 pos = vec3(ivec3(((section<<detail)-baseSectionPos)<<5));
+    vec3 cmin = ivec3(extractMin(aabb)*(1<<detail));
+    vec3 cmax = ivec3((extractMax(aabb)+1)*(1<<detail));

-    vec3 minBB = proj(pos);
+
+    //TODO:FIXME: either pos,cmin,cmax isnt correct, aswell as the miplevel isnt correct as its sampling at the wrong detail level
+
+    vec3 minBB = proj(pos + cmin);//
    vec3 maxBB = minBB;
+
    for (int i = 1; i < 8; i++) {
-        vec3 point = proj(pos+mix(cmin, cmax, bvec3((i&1)!=0,(i&2)!=0,(i&4)!=0)));
+        vec3 point = proj(pos + mix(cmin, cmax, bvec3((i&1)!=0,(i&2)!=0,(i&4)!=0)));
        minBB = min(minBB, point);
        maxBB = max(maxBB, point);
    }
@@ -32,7 +36,7 @@ bool testHiZ(PosHeader secPos, AABBHeader aabb) {
    maxBB = maxBB*0.5+0.5;

    vec2 size = (maxBB.xy - minBB.xy) * vec2(screensize);
-    float miplevel = ceil(log2(max(size.x, size.y)/2));//NOTE: the /2 is cause the mipmaps dont include bottom level depth
+    float miplevel = ceil(log2(max(size.x, size.y)));//NOTE: the /2 is cause the mipmaps dont include bottom level depth

    float a = textureLod(hizSampler,minBB.xy,miplevel).r;
    float b = textureLod(hizSampler,vec2(minBB.x,maxBB.y),miplevel).r;
@@ -59,7 +63,7 @@ void main() {
    PosHeader pos   = geometryPool[meshletId*MESHLET_SIZE];
    AABBHeader aabb = geometryPool[meshletId*MESHLET_SIZE+1];

-    if (true||testHiZ(pos, aabb)) {//If didnt cull, insert it back into the stream
+    if (testHiZ(pos, aabb)) {//If didnt cull, insert it back into the stream
        meshlets[atomicAdd(drawCmd.instanceCount, 1)+fullMeshletCount] = meshletId;
    }
 }
--- a/src/main/resources/assets/voxy/shaders/lod/gl46mesh/quads.frag
+++ b/src/main/resources/assets/voxy/shaders/lod/gl46mesh/quads.frag
@@ -19,7 +19,7 @@ void main() {
    //vec4 colour = solidColour;
    vec4 colour = texture(blockModelAtlas, uv + baseUV, ((flags>>1)&1u)*-4.0);
    if ((flags&1u) == 1 && colour.a <= 0.25f) {
-        discard;
+        //discard;
    }

    //Conditional tinting, TODO: FIXME: REPLACE WITH MASK OR SOMETHING, like encode data into the top bit of alpha
@@ -31,12 +31,11 @@ void main() {

    //outColour = vec4(uv + baseUV, 0, 1);

-    /*
+
    uint hash = meshlet*1231421+123141;
    hash ^= hash>>16;
    hash = hash*1231421+123141;
    hash ^= hash>>16;
-
-    outColour = vec4(float(hash&15u)/15, float((hash>>4)&15u)/15, float((hash>>8)&15u)/15, 1);
-    */
+    hash = hash * 1827364925 + 123325621;
+    //outColour = vec4(float(hash&15u)/15, float((hash>>4)&15u)/15, float((hash>>8)&15u)/15, 1);
 }
--- a/src/main/resources/assets/voxy/shaders/lod/gl46mesh/quads.vert
+++ b/src/main/resources/assets/voxy/shaders/lod/gl46mesh/quads.vert
@@ -84,6 +84,7 @@ void main() {
    uint lodLevel = extractDetail(meshletPosition);
    ivec3 sectionPos = extractPosition(meshletPosition);

+    //meshlet = (meshlet<<5)|(gl_VertexID>>2);