✨ Make it work with texture arrays that are written at the same time

davidAlgis · davidAlgis · commit ef6c8f10b90d · 2023-04-04T11:34:33.000+02:00
diff --git a/Plugin/PluginInteropUnityCUDA/include/Texture/texture.h b/Plugin/PluginInteropUnityCUDA/include/Texture/texture.h
@@ -106,7 +106,7 @@ class Texture
     UNITY_INTERFACE_EXPORT void *getNativeTexturePtr() const;
 
     /**
-     * Get the pointer of _surfObjArray
+     * Get the pointer of d_surfObjArray
      * This array of surface object is necessary
      * to write or read into a texture
      */
@@ -137,9 +137,15 @@ class Texture
 
     private:
     // An array of surface object that will be of the size of texture depth
+    // This array is allocated on the host side and is copied to device memory
+    // when the texture is mapped to surface objects
+    cudaSurfaceObject_t *_surfObjArray;
+
+    // A device array of surface objects whose size is the texture depth.
+    // This array is allocated in device memory.
     // the surface object is the object that you can used to write into texture
     // from cuda api (eg. with surf2DWrite)
-    cudaSurfaceObject_t *_surfObjArray;
+    cudaSurfaceObject_t *d_surfObjArray;
 
     dim3 _dimBlock;
     dim3 _dimGrid;
diff --git a/Plugin/PluginInteropUnityCUDA/src/Texture/texture.cpp b/Plugin/PluginInteropUnityCUDA/src/Texture/texture.cpp
@@ -29,6 +29,9 @@ Texture::Texture(void *textureHandle, int textureWidth, int textureHeight,
     // initialize surface object
     _surfObjArray = new cudaSurfaceObject_t[textureDepth];
 
+    CUDA_CHECK(cudaMalloc(&d_surfObjArray,
+                          _textureDepth * sizeof(cudaSurfaceObject_t)));
+
     for (int i = 0; i < textureDepth; i++)
     {
         _surfObjArray[i] = 0;
@@ -40,6 +43,7 @@ Texture::Texture(void *textureHandle, int textureWidth, int textureHeight,
 Texture::~Texture()
 {
     delete (_surfObjArray);
+    CUDA_CHECK(cudaFree(d_surfObjArray));
 }
 
 void Texture::mapTextureToSurfaceObject()
@@ -63,6 +67,9 @@ void Texture::mapTextureToSurfaceObject()
         CUDA_CHECK(cudaCreateSurfaceObject(&_surfObjArray[i], &resDesc));
         CUDA_CHECK(cudaGetLastError());
     }
+    CUDA_CHECK(cudaMemcpy(d_surfObjArray, _surfObjArray,
+                          _textureDepth * sizeof(cudaSurfaceObject_t),
+                          cudaMemcpyHostToDevice));
 }
 
 void Texture::unmapTextureToSurfaceObject()
@@ -108,7 +115,9 @@ void *Texture::getNativeTexturePtr() const
 
 cudaSurfaceObject_t *Texture::getSurfaceObjectArray() const
 {
-    return _surfObjArray;
+    // To use a complete array of surface objects in a kernel,
+    // we need to use the array allocated in device memory
+    return d_surfObjArray;
 }
 
 cudaSurfaceObject_t Texture::getSurfaceObject(int indexInArray) const
@@ -121,5 +130,10 @@ cudaSurfaceObject_t Texture::getSurfaceObject(int indexInArray) const
         return 0;
     }
 
+    // To use a single surface object in a kernel,
+    // we can directly use the surface object that
+    // is on the host side, because cudaSurfaceObject_t is a
+    // typedef for unsigned long long, an opaque handle that is
+    // passed by value as a kernel argument (it is not managed memory).
     return _surfObjArray[indexInArray];
 }
diff --git a/Plugin/SampleBasic/src/sample_kernels.cu b/Plugin/SampleBasic/src/sample_kernels.cu
@@ -56,11 +56,7 @@ void kernelCallerWriteTextureArray(const dim3 dimGrid, const dim3 dimBlock,
                                    const float time, const int width,
                                    const int height, const int depth)
 {
-
-    writeTex<<<dimGrid, dimBlock>>>(surfObjArray[0], width, height, time);
-
-    writeTex<<<dimGrid, dimBlock>>>(surfObjArray[1], width, height, 2*time);
-    // writeTexArray<<<dimGrid, dimBlock>>>(surfObjArray, width, height, depth, time);
+    writeTexArray<<<dimGrid, dimBlock>>>(surfObjArray, width, height, depth, time);
 }
 
 void kernelCallerWriteBuffer(const dim3 dimGrid, const dim3 dimBlock,

Original file line number	Diff line number	Diff line change
`@@ -29,6 +29,9 @@ Texture::Texture(void *textureHandle, int textureWidth, int textureHeight,`
`29`	`29`	`// initialize surface object`
`30`	`30`	`_surfObjArray = new cudaSurfaceObject_t[textureDepth];`
`31`	`31`
	`32`	`+ CUDA_CHECK(cudaMalloc(&d_surfObjArray,`
	`33`	`+ _textureDepth * sizeof(cudaSurfaceObject_t)));`
	`34`	`+`
`32`	`35`	`for (int i = 0; i < textureDepth; i++)`
`33`	`36`	`{`
`34`	`37`	`_surfObjArray[i] = 0;`
`@@ -40,6 +43,7 @@ Texture::Texture(void *textureHandle, int textureWidth, int textureHeight,`
`40`	`43`	`Texture::~Texture()`
`41`	`44`	`{`
`42`	`45`	`delete (_surfObjArray);`
	`46`	`+ CUDA_CHECK(cudaFree(d_surfObjArray));`
`43`	`47`	`}`
`44`	`48`
`45`	`49`	`void Texture::mapTextureToSurfaceObject()`
`@@ -63,6 +67,9 @@ void Texture::mapTextureToSurfaceObject()`
`63`	`67`	`CUDA_CHECK(cudaCreateSurfaceObject(&_surfObjArray[i], &resDesc));`
`64`	`68`	`CUDA_CHECK(cudaGetLastError());`
`65`	`69`	`}`
	`70`	`+ CUDA_CHECK(cudaMemcpy(d_surfObjArray, _surfObjArray,`
	`71`	`+ _textureDepth * sizeof(cudaSurfaceObject_t),`
	`72`	`+ cudaMemcpyHostToDevice));`
`66`	`73`	`}`
`67`	`74`
`68`	`75`	`void Texture::unmapTextureToSurfaceObject()`
`@@ -108,7 +115,9 @@ void *Texture::getNativeTexturePtr() const`
`108`	`115`
`109`	`116`	`cudaSurfaceObject_t *Texture::getSurfaceObjectArray() const`
`110`	`117`	`{`
`111`		`- return _surfObjArray;`
	`118`	`+ // To use a complete array of surface objects in a kernel,`
	`119`	`+ // we need to use the array allocated in device memory`
	`120`	`+ return d_surfObjArray;`
`112`	`121`	`}`
`113`	`122`
`114`	`123`	`cudaSurfaceObject_t Texture::getSurfaceObject(int indexInArray) const`
`@@ -121,5 +130,10 @@ cudaSurfaceObject_t Texture::getSurfaceObject(int indexInArray) const`
`121`	`130`	`return 0;`
`122`	`131`	`}`
`123`	`132`
	`133`	`+ // To use a single surface object in a kernel,`
	`134`	`+ // we can directly use the surface object that`
	`135`	`+ // is on the host side, because cudaSurfaceObject_t is a`
	`136`	`+ // typedef for unsigned long long, an opaque handle that is`
	`137`	`+ // passed by value as a kernel argument (it is not managed memory).`
`124`	`138`	`return _surfObjArray[indexInArray];`
`125`	`139`	`}`
Original file line number	Diff line number	Diff line change
`@@ -56,11 +56,7 @@ void kernelCallerWriteTextureArray(const dim3 dimGrid, const dim3 dimBlock,`
`56`	`56`	`const float time, const int width,`
`57`	`57`	`const int height, const int depth)`
`58`	`58`	`{`
`59`		`-`
`60`		`- writeTex<<<dimGrid, dimBlock>>>(surfObjArray[0], width, height, time);`
`61`		`-`
`62`		`- writeTex<<<dimGrid, dimBlock>>>(surfObjArray[1], width, height, 2*time);`
`63`		`- // writeTexArray<<<dimGrid, dimBlock>>>(surfObjArray, width, height, depth, time);`
	`59`	`+ writeTexArray<<<dimGrid, dimBlock>>>(surfObjArray, width, height, depth, time);`
`64`	`60`	`}`
`65`	`61`
`66`	`62`	`void kernelCallerWriteBuffer(const dim3 dimGrid, const dim3 dimBlock,`