Refactoring

2026-01-14 15:48:43 +01:00 · 2018-11-01 15:17:13 +01:00
parent 064027fc0b
commit 2b899d1c80
10 changed files with 234 additions and 194 deletions
--- a/GPUSimulators/cuda/SWE2D_KP07_dimsplit.cu
+++ b/GPUSimulators/cuda/SWE2D_KP07_dimsplit.cu
@@ -38,39 +38,37 @@ void computeFluxF(float Q[3][BLOCK_HEIGHT+4][BLOCK_WIDTH+4],
    const int tx = threadIdx.x;
    const int ty = threadIdx.y;
    
-    {
-        int j=ty;
-        const int l = j + 2; //Skip ghost cells
-        for (int i=tx; i<BLOCK_WIDTH+1; i+=BLOCK_WIDTH) {
-            const int k = i + 1;
-            // Reconstruct point values of Q at the left and right hand side 
-            // of the cell for both the left (i) and right (i+1) cell 
-            const float3 Q_rl = make_float3(Q[0][l][k+1] - 0.5f*Qx[0][j][i+1],
-                                            Q[1][l][k+1] - 0.5f*Qx[1][j][i+1],
-                                            Q[2][l][k+1] - 0.5f*Qx[2][j][i+1]);
-            const float3 Q_rr = make_float3(Q[0][l][k+1] + 0.5f*Qx[0][j][i+1],
-                                            Q[1][l][k+1] + 0.5f*Qx[1][j][i+1],
-                                            Q[2][l][k+1] + 0.5f*Qx[2][j][i+1]);
-                                         
-            const float3 Q_ll = make_float3(Q[0][l][k] - 0.5f*Qx[0][j][i],
-                                            Q[1][l][k] - 0.5f*Qx[1][j][i],
-                                            Q[2][l][k] - 0.5f*Qx[2][j][i]);
-            const float3 Q_lr = make_float3(Q[0][l][k] + 0.5f*Qx[0][j][i],
-                                            Q[1][l][k] + 0.5f*Qx[1][j][i],
-                                            Q[2][l][k] + 0.5f*Qx[2][j][i]);
-                                    
-            //Evolve half a timestep (predictor step)
-            const float3 Q_r_bar = Q_rl + dt_/(2.0f*dx_) * (F_func(Q_rl, g_) - F_func(Q_rr, g_));
-            const float3 Q_l_bar = Q_lr + dt_/(2.0f*dx_) * (F_func(Q_ll, g_) - F_func(Q_lr, g_));
+    int j=ty;
+    const int l = j + 2; //Skip ghost cells
+    for (int i=tx; i<BLOCK_WIDTH+1; i+=BLOCK_WIDTH) {
+        const int k = i + 1;
+        // Reconstruct point values of Q at the left and right hand side 
+        // of the cell for both the left (i) and right (i+1) cell 
+        const float3 Q_rl = make_float3(Q[0][l][k+1] - 0.5f*Qx[0][j][i+1],
+                                        Q[1][l][k+1] - 0.5f*Qx[1][j][i+1],
+                                        Q[2][l][k+1] - 0.5f*Qx[2][j][i+1]);
+        const float3 Q_rr = make_float3(Q[0][l][k+1] + 0.5f*Qx[0][j][i+1],
+                                        Q[1][l][k+1] + 0.5f*Qx[1][j][i+1],
+                                        Q[2][l][k+1] + 0.5f*Qx[2][j][i+1]);
+                                     
+        const float3 Q_ll = make_float3(Q[0][l][k] - 0.5f*Qx[0][j][i],
+                                        Q[1][l][k] - 0.5f*Qx[1][j][i],
+                                        Q[2][l][k] - 0.5f*Qx[2][j][i]);
+        const float3 Q_lr = make_float3(Q[0][l][k] + 0.5f*Qx[0][j][i],
+                                        Q[1][l][k] + 0.5f*Qx[1][j][i],
+                                        Q[2][l][k] + 0.5f*Qx[2][j][i]);
+                                
+        //Evolve half a timestep (predictor step)
+        const float3 Q_r_bar = Q_rl + dt_/(2.0f*dx_) * (F_func(Q_rl, g_) - F_func(Q_rr, g_));
+        const float3 Q_l_bar = Q_lr + dt_/(2.0f*dx_) * (F_func(Q_ll, g_) - F_func(Q_lr, g_));

-            // Compute flux based on prediction
-            const float3 flux = CentralUpwindFlux(Q_l_bar, Q_r_bar, g_);
-            
-            //Write to shared memory
-            F[0][j][i] = flux.x;
-            F[1][j][i] = flux.y;
-            F[2][j][i] = flux.z;
-        }
+        // Compute flux based on prediction
+        const float3 flux = CentralUpwindFlux(Q_l_bar, Q_r_bar, g_);
+        
+        //Write to shared memory
+        F[0][j][i] = flux.x;
+        F[1][j][i] = flux.y;
+        F[2][j][i] = flux.z;
    }    
 }

@@ -178,7 +176,7 @@ __global__ void KP07DimsplitKernel(
    //Step 0 => evolve x first, then y
    if (step_ == 0) {
        //Compute fluxes along the x axis and evolve
-        minmodSlopeX(Q, Qx, theta_);
+        minmodSlopeX<w, h, gc, vars>(Q, Qx, theta_);
        __syncthreads();
        computeFluxF(Q, Qx, F, g_, dx_, dt_);
        __syncthreads();
@@ -194,7 +192,7 @@ __global__ void KP07DimsplitKernel(
        
        
        //Compute fluxes along the y axis and evolve
-        minmodSlopeY(Q, Qx, theta_);
+        minmodSlopeY<w, h, gc, vars>(Q, Qx, theta_);
        __syncthreads();
        
        computeFluxG(Q, Qx, F, g_, dy_, dt_);
@@ -205,7 +203,7 @@ __global__ void KP07DimsplitKernel(
    //Step 1 => evolve y first, then x
    else {
        //Compute fluxes along the y axis and evolve
-        minmodSlopeY(Q, Qx, theta_);
+        minmodSlopeY<w, h, gc, vars>(Q, Qx, theta_);
        __syncthreads();
        computeFluxG(Q, Qx, F, g_, dy_, dt_);
        __syncthreads();
@@ -219,7 +217,7 @@ __global__ void KP07DimsplitKernel(
        __syncthreads();
        
        //Compute fluxes along the x axis and evolve
-        minmodSlopeX(Q, Qx, theta_);
+        minmodSlopeX<w, h, gc, vars>(Q, Qx, theta_);
        __syncthreads();
        computeFluxF(Q, Qx, F, g_, dx_, dt_);
        __syncthreads();