summaryrefslogtreecommitdiff
path: root/src/gpu/effects
diff options
context:
space:
mode:
authorskal <pascal.massimino@gmail.com>2026-02-14 00:27:53 +0100
committerskal <pascal.massimino@gmail.com>2026-02-14 00:27:53 +0100
commitf7c5c19af1b4638958c6875c6f691b2c9aa05a94 (patch)
tree9d561ea294f93640100f69a6ad80ff7f0fd41b43 /src/gpu/effects
parent71ff356ef03b5d07bcd7a36b79cf95df1206717b (diff)
CNN v2: Fix weight buffer offset bug
Root cause: Binary format is [header:20B][layer_info:20B×N][weights]. Both cnn_test and CNNv2Effect uploaded entire file to weights_buffer, but shader reads weights_buffer[0] expecting first weight, not header. Fix: Skip header + layer_info when uploading to GPU buffer. - cnn_test.cc: Calculate weights_offset, upload only weights section - cnn_v2_effect.cc: Same fix for runtime effect Before: layer_0 output showed [R, uv_x, uv_y, black] (wrong channels) After: layer_0 output shows [R, G, B, D] (correct identity mapping) Tests: 34/36 passing (2 unrelated failures)
Diffstat (limited to 'src/gpu/effects')
-rw-r--r--src/gpu/effects/cnn_v2_effect.cc14
1 files changed, 9 insertions, 5 deletions
diff --git a/src/gpu/effects/cnn_v2_effect.cc b/src/gpu/effects/cnn_v2_effect.cc
index 3985723..366a232 100644
--- a/src/gpu/effects/cnn_v2_effect.cc
+++ b/src/gpu/effects/cnn_v2_effect.cc
@@ -111,17 +111,21 @@ void CNNv2Effect::load_weights() {
layer_info_.push_back(info);
}
- // Create GPU storage buffer for weights
- // Buffer contains: header + layer info + packed f16 weights (as u32)
+ // Create GPU storage buffer for weights (skip header + layer info, upload only weights)
+ size_t header_size = 20; // 5 u32
+ size_t layer_info_size = 20 * num_layers; // 5 u32 per layer
+ size_t weights_offset = header_size + layer_info_size;
+ size_t weights_only_size = weights_size - weights_offset;
+
WGPUBufferDescriptor buffer_desc = {};
- buffer_desc.size = weights_size;
+ buffer_desc.size = weights_only_size;
buffer_desc.usage = WGPUBufferUsage_Storage | WGPUBufferUsage_CopyDst;
buffer_desc.mappedAtCreation = false;
weights_buffer_ = wgpuDeviceCreateBuffer(ctx_.device, &buffer_desc);
- // Upload weights data
- wgpuQueueWriteBuffer(ctx_.queue, weights_buffer_, 0, weights_data, weights_size);
+ // Upload only weights (skip header + layer info)
+ wgpuQueueWriteBuffer(ctx_.queue, weights_buffer_, 0, weights_data + weights_offset, weights_only_size);
// Create uniform buffers for layer params (one per layer)
for (uint32_t i = 0; i < num_layers; ++i) {