hadamard: consider channel_data_stride in offset calculations - ogl_beamforming - Ultrasound Beamforming Implemented with OpenGL

Commit: bc9501d0dc21b40d20e3be5e1d560923befe75fd
Parent: b7dbc9dd661a816a5d223e5c7e16abf4bcca7235
Author: Randy Palamar
Date:   Wed, 10 Jul 2024 10:33:15 -0600

hadamard: consider channel_data_stride in offset calculations

Diffstat:
M beamformer.c  | 2 +-
M beamformer_parameters.h  | 1 +
M shaders/hadamard.glsl  | 37 ++++++++++++++++++++++---------------

3 files changed, 24 insertions(+), 16 deletions(-)
diff --git a/beamformer.c b/beamformer.c
@@ -6,7 +6,7 @@ alloc_shader_storage(BeamformerCtx *ctx, Arena a)
 {
 	uv4 rf_data_dim        = ctx->params->rf_data_dim;
 	ctx->csctx.rf_data_dim = rf_data_dim;
-	size rf_raw_size       = rf_data_dim.x * rf_data_dim.y * rf_data_dim.z * sizeof(i16);
+	size rf_raw_size       = ctx->params->channel_data_stride * rf_data_dim.y * rf_data_dim.z * sizeof(i16);
 	size rf_decoded_size   = rf_data_dim.x * rf_data_dim.y * rf_data_dim.z * sizeof(f32);
 
 	glDeleteBuffers(ARRAY_COUNT(ctx->csctx.rf_data_ssbos), ctx->csctx.rf_data_ssbos);
diff --git a/beamformer_parameters.h b/beamformer_parameters.h
@@ -16,4 +16,5 @@ typedef struct {
 	f32 speed_of_sound;         /* [m/s] */
 	f32 sampling_frequency;     /* [Hz]  */
 	f32 focal_depth;            /* [m]   */
+	f32 _pad[3];
 } BeamformerParameters;
diff --git a/shaders/hadamard.glsl b/shaders/hadamard.glsl
@@ -33,41 +33,48 @@ layout(std140, binding = 0) uniform parameters {
 void main()
 {
 	/* NOTE: each invocation takes a time sample (row) and a receive channel (column).
-	 * it does the dot product of that column with the equivalent row of the hadamard matrix.
-	 * the result is stored to the same row, column index of the output data.
+	 * It first maps the column to the correct column in the rf data then
+	 * does the dot product with the equivalent row of the hadamard matrix.
+	 * The result is stored to the equivalent row, column index of the output.
 	 */
 	uint time_sample = gl_GlobalInvocationID.x;
 	uint channel     = gl_GlobalInvocationID.y;
 	uint acq         = gl_GlobalInvocationID.z;
 
-	/* offset to get the correct column in hadamard matrix */
+	/* NOTE: offset to get the correct column in hadamard matrix */
 	uint hoff = rf_data_dim.z * acq;
 
-	/* TODO: make sure incoming data is organized so that stride is 1
-	 * i.e. each column should be a single time sample for all channels
-	 * alternatively we can tell opengl to store the rf data in row major order
-	 */
+	/* NOTE: offsets for storing the results in the output data */
+	uint out_stride = rf_data_dim.x * rf_data_dim.y;
+	uint out_off    = rf_data_dim.x * channel + time_sample;
+
+	/* TODO: channel_mapping */
+	//uint ch_base_idx = (channel + channel_offset) / 4;
+	//uint ch_sub_idx  = (channel + channel_offset) - ch_base_idx;
+	//uint rf_channel  = channel_mapping[ch_base_idx][ch_sub_idx];
+	uint rf_channel = channel;
 
-	/* offset to get the time sample and row in rf data */
-	uint rstride = rf_data_dim.x * rf_data_dim.y;
-	uint rfoff   = rf_data_dim.x * channel + time_sample;
+	/* NOTE: offsets to get the time sample and row in rf data */
+	uint rf_stride = channel_data_stride * rf_data_dim.y;
+	uint rf_off    = channel_data_stride * rf_channel + time_sample;
 
-	uint ridx       = rfoff / 2;
-	uint ridx_delta = rstride / 2;
+	/* NOTE: rf_data index and stride considering the data is i16 not i32 */
+	uint ridx       = rf_off / 2;
+	uint ridx_delta = rf_stride / 2;
 
 	/* NOTE: rf_data is i16 so each access grabs two time samples at a time.
 	 * We need to shift arithmetically (maintaining the sign) to get the
 	 * desired element. If the time sample is even we take the upper half
 	 * and if it's odd we take the lower half. */
-	uint lfs = ~(time_sample & 1) * 16;
+	uint lfs = ~(time_sample & 1u) * 16;
 
 	/* NOTE: Compute N-D dot product */
 	int sum = 0;
 	for (int i = 0; i < rf_data_dim.z; i++) {
 		int data = (rf_data[ridx] << lfs) >> 16;
-		sum += hadamard[hoff + i] * data;
+		sum  += hadamard[hoff + i] * data;
 		ridx += ridx_delta;
 	}
 
-	out_data[rfoff + rstride * acq] = float(sum);
+	out_data[out_off + out_stride * acq] = float(sum);
 }

M	beamformer.c	\|	2	+-
M	beamformer_parameters.h	\|	1	+
M	shaders/hadamard.glsl	\|	37	++++++++++++++++++++++---------------