AllenZYJ
diff --git a/‎conv_backward_test.cpp‎
Lines changed: 138 additions & 0 deletions b/‎conv_backward_test.cpp‎
Lines changed: 138 additions & 0 deletions
diff --git a/‎matrix/matrix_pro.h‎
Lines changed: 53 additions & 96 deletions b/‎matrix/matrix_pro.h‎
Lines changed: 53 additions & 96 deletions
@@ -0,0 +1,138 @@
+#include <cassert>
+#include <cmath>
+#include <iostream>
+#include "./matrix/matrix_def.h"
+#include "./matrix/matrix_pro.h"
+#include "./root/include/edgelayer.h"
+
+// Helper: returns true when a is approximately equal to b, i.e. when
+// |a - b| <= atol + rtol * |b|.
+// The relative term scales with b only, so the check is not symmetric in its
+// arguments: pass the reference (expected) value as b.
+// Exactly equal values always compare close; this also covers two equal
+// infinities, whose difference would otherwise be NaN. NaN never compares close.
+bool is_close(float a, float b, float rtol = 1e-5, float atol = 1e-8) {
+    if (a == b) {
+        return true;
+    }
+    return std::fabs(a - b) <= (atol + rtol * std::fabs(b));
+}
+
+// Test driver for conv2d forward/backward.
+// Builds a fixed 1x3x4x4 input and fixed 3x3 kernels, runs forward and
+// backward, asserts the result shapes, and compares the input gradients with
+// hand-computed reference values.
+// Returns 0 when every gradient matches, 1 otherwise.
+int main() {
+    // Build the test input (batch=1, channels=3, height=4, width=4).
+    Matrix4d input = CreateMatrix4d(1, 3, 4, 4);
+
+    // Fill the input with fixed test values.
+    float test_input[3][4][4] = {
+        {{1,2,3,4}, {2,3,4,5}, {3,4,5,6}, {4,5,6,7}},  // channel 1
+        {{2,4,6,8}, {4,6,8,10}, {6,8,10,12}, {8,10,12,14}},  // channel 2
+        {{3,6,9,12}, {6,9,12,15}, {9,12,15,18}, {12,15,18,21}}  // channel 3
+    };
+
+    for(int c = 0; c < 3; c++) {
+        for(int i = 0; i < 4; i++) {
+            for(int j = 0; j < 4; j++) {
+                input.matrix4d[0].matrix3d[c].matrix[i][j] = test_input[c][i][j];
+            }
+        }
+    }
+
+    // Create the convolution layer. The concrete pointer is kept for
+    // set_kernel(); forward/backward are called through the edge_layer
+    // interface, as a real network would do.
+    conv2d* conv_ptr = new conv2d(input, 3, 2, 1, 3, 0, 1);
+    edge_layer* conv = conv_ptr;
+
+    // Fixed kernel values, indexed [in_channel][out_channel][row][col].
+    float test_kernel[3][2][3][3] = {
+        {{{1,0,1}, {0,1,0}, {1,0,1}},  // in_channel 0, out_channel 0
+         {{0,1,0}, {1,0,1}, {0,1,0}}}, // in_channel 0, out_channel 1
+        {{{1,1,0}, {1,0,1}, {0,1,1}},  // in_channel 1, out_channel 0
+         {{0,1,1}, {1,0,1}, {1,1,0}}}, // in_channel 1, out_channel 1
+        {{{0,0,1}, {0,1,0}, {1,0,0}},  // in_channel 2, out_channel 0
+         {{1,0,0}, {0,1,0}, {0,0,1}}}  // in_channel 2, out_channel 1
+    };
+
+    for(int in_c = 0; in_c < 3; in_c++) {
+        for(int out_c = 0; out_c < 2; out_c++) {
+            conv_ptr->set_kernel(&test_kernel[in_c][out_c][0][0], in_c, out_c);
+        }
+    }
+
+    // Forward pass.
+    Matrix4d output = conv->forward(input);
+    std::cout << "Forward output shape:" << std::endl;
+    print_shape(output);
+    std::cout << "Forward output values:" << std::endl;
+    cout_mat4d(output);
+
+    // Check the forward output shape.
+    // Expected spatial size: ((4 + 2*1 - 3) / 1) + 1 = 4.
+    const int expected_size = ((4 + 2*1 - 3) / 1) + 1;
+    assert(output.batch == 1);
+    assert(output.dep == 2);
+    assert(output.wid == expected_size);
+    assert(output.high == expected_size);
+
+    // Fixed upstream gradient with the same shape as the forward output.
+    Matrix4d grad_output = CreateMatrix4d(1, 2, expected_size, expected_size);
+    float test_grad[2][4][4] = {
+        {{1,1,1,1}, {1,1,1,1}, {1,1,1,1}, {1,1,1,1}},  // out_channel 0
+        {{0.5,0.5,0.5,0.5}, {0.5,0.5,0.5,0.5}, {0.5,0.5,0.5,0.5}, {0.5,0.5,0.5,0.5}}  // out_channel 1
+    };
+
+    for(int c = 0; c < 2; c++) {
+        for(int i = 0; i < 4; i++) {
+            for(int j = 0; j < 4; j++) {
+                grad_output.matrix4d[0].matrix3d[c].matrix[i][j] = test_grad[c][i][j];
+            }
+        }
+    }
+
+    // Backward pass.
+    Matrix4d grad_input = conv->backward(grad_output);
+    std::cout << "Backward gradients shape:" << std::endl;
+    print_shape(grad_input);
+    std::cout << "Backward gradients values:" << std::endl;
+    cout_mat4d(grad_input);
+
+    // The input gradient must have the same shape as the input.
+    assert(grad_input.batch == 1);
+    assert(grad_input.dep == 3);
+    assert(grad_input.wid == 4);
+    assert(grad_input.high == 4);
+
+    // Hand-computed reference gradients for every input position.
+    float expected_grads[3][4][4] = {
+        // channel 0
+        {
+            {2.0f, 1.5f, 1.5f, 1.0f},
+            {1.5f, 2.0f, 2.0f, 1.5f},
+            {1.5f, 2.0f, 2.0f, 1.5f},
+            {1.0f, 1.5f, 1.5f, 1.0f}
+        },
+        // channel 1
+        {
+            {2.5f, 2.0f, 2.0f, 1.5f},
+            {2.0f, 3.0f, 3.0f, 2.0f},
+            {2.0f, 3.0f, 3.0f, 2.0f},
+            {1.5f, 2.0f, 2.0f, 1.5f}
+        },
+        // channel 2
+        {
+            {1.5f, 1.0f, 1.0f, 0.5f},
+            {1.0f, 1.5f, 1.5f, 1.0f},
+            {1.0f, 1.5f, 1.5f, 1.0f},
+            {0.5f, 1.0f, 1.0f, 0.5f}
+        }
+    };
+
+    // Count mismatches instead of only printing them, so a wrong gradient
+    // actually fails the test run.
+    int mismatches = 0;
+    for(int c = 0; c < 3; c++) {
+        for(int i = 0; i < 4; i++) {
+            for(int j = 0; j < 4; j++) {
+                float actual = grad_input.matrix4d[0].matrix3d[c].matrix[i][j];
+                float expected = expected_grads[c][i][j];
+                if (!is_close(actual, expected)) {
+                    std::cout << "Gradient mismatch at position [" << c << "][" << i << "][" << j << "]" << std::endl;
+                    std::cout << "Expected: " << expected << ", Got: " << actual << std::endl;
+                    ++mismatches;
+                }
+            }
+        }
+    }
+
+    // Delete through the concrete type so the conv2d destructor always runs.
+    delete conv_ptr;
+
+    if (mismatches != 0) {
+        std::cout << "Gradient check failed: " << mismatches << " mismatched value(s)" << std::endl;
+        return 1;
+    }
+
+    std::cout << "All tests passed!" << std::endl;
+    return 0;
+}
@@ -593,112 +593,69 @@ Matrix3d conv_test(Matrix3d mid1, int input_dim = 3, int output_channels = 3, in
 	}
 }
 Matrix3d conv_test_with_output(Matrix3d mid1,
-							   int input_dim = 3,
-							   int output_channels = 3,
-							   int stride = 1,
-							   int kernel_size = 2,
-							   int mode = 0,
-							   bool verbose = false)
-// padding 暂未实现
-{
-	if (verbose)
-	{
-		cout << "Input Matrix3d: " << endl;
-		cout_mat3d(mid1);
-		cout << "Parameters: input_dim = " << input_dim
-			 << ", output_channels = " << output_channels
-			 << ", stride = " << stride
-			 << ", kernel_size = " << kernel_size
-			 << ", mode = " << mode;
-	}
-
-	// Compute padding widths and heights
-	int padding_wid = stride - (mid1.wid - kernel_size) % stride;
-	if (padding_wid == stride)
-	{
-		padding_wid = 0;
-	}
-	int padding_high = stride - (mid1.high - kernel_size) % stride;
-	if (padding_high == stride)
-	{
-		padding_high = 0;
-	}
-	if (verbose)
-	{
-		cout << "Padding widths: " << padding_wid << ", padding heights: " << padding_high << endl;
-	}
-
-	// Pad each RGB channel in the 3D matrix
-	Matrix mid_rgb[input_dim];
-	for (int rgb_idx = 0; rgb_idx < input_dim; rgb_idx++)
-	{
-		mid_rgb[rgb_idx] = edge_padding(mid1.matrix3d[rgb_idx],
-										mid1.matrix3d[rgb_idx].row + padding_high,
-										mid1.matrix3d[rgb_idx].col + padding_wid);
-		if (verbose)
-		{
-			cout << "RGB[" << rgb_idx << "] channel after padding: " << endl;
-			cout_mat(mid_rgb[rgb_idx]);
+							 int input_dim = 3,
+							 int output_channels = 3,
+							 int stride = 1,
+							 int kernel_size = 2,
+							 int mode = 0,
+							 int padding = 0,
+							 bool verbose = false)
+{
+	// 如果需要padding，先对输入进行padding
+	if (padding > 0) {
+		Matrix3d padded_input = CreateMatrix3d(mid1.dep, mid1.wid + 2*padding, mid1.high + 2*padding);
+		for (int c = 0; c < mid1.dep; c++) {
+			padded_input.matrix3d[c] = edge_padding(mid1.matrix3d[c], 
+												  mid1.wid + 2*padding, 
+												  mid1.high + 2*padding);
 		}
+		mid1 = padded_input;
 	}
 
-	// Construct filters
-	Matrix filters[input_dim][output_channels];
-	for (int channel_index = 0; channel_index < input_dim; channel_index++)
-	{
+	// 计算输出尺寸
+	int output_height = ((mid1.wid - kernel_size) / stride) + 1;
+	int output_width = ((mid1.high - kernel_size) / stride) + 1;
 
-		for (int filter_index = 0; filter_index < output_channels; filter_index++)
-		{
-			Matrix kernel = ones(kernel_size, kernel_size);
-			filters[channel_index][filter_index] = kernel;
+	Matrix3d output3d = CreateMatrix3d(output_channels, output_height, output_width);
+	
+	// 构造卷积核
+	Matrix** filters = (Matrix**)malloc(input_dim * sizeof(Matrix*));
+	for(int i = 0; i < input_dim; i++) {
+		filters[i] = (Matrix*)malloc(output_channels * sizeof(Matrix));
+		for(int j = 0; j < output_channels; j++) {
+			filters[i][j] = ones(kernel_size, kernel_size);
 		}
 	}
 
-	// Compute convolution results for each filter
-	Matrix kernel = ones(kernel_size, kernel_size);
-	Matrix feature_maps[output_channels];
-	for (int filter_idx = 0; filter_idx < output_channels; filter_idx++)
-	{
-		Matrix sum_rgb = CreateMatrix(((mid1.wid - kernel_size + 2 * padding_wid) / stride) + 1,
-									  ((mid1.high - kernel_size + 2 * padding_high) / stride) + 1);
-		for (int channel_idx = 0; channel_idx < input_dim; channel_idx++)
-		{
-			// Compute convolution result for a single RGB channel and a single filter
-			Matrix element = conv_element(mid_rgb[channel_idx],
-										  filters[channel_idx][filter_idx],
-										  kernel_size, stride);
-			if (verbose)
-			{
-				cout << "Convolution of RGB[" << channel_idx << "] channel with Filter["
-					 << filter_idx << "] : " << endl;
-				cout_mat(mid_rgb[channel_idx]);
-				cout << " * " << endl;
-				cout_mat(filters[channel_idx][filter_idx]);
-				cout << " = " << endl;
-				cout_mat(element);
-				cout << endl;
+	// 执行卷积操作
+	for(int out_c = 0; out_c < output_channels; out_c++) {
+		for(int h = 0; h < output_height; h++) {
+			for(int w = 0; w < output_width; w++) {
+				float sum = 0;
+				for(int in_c = 0; in_c < input_dim; in_c++) {
+					for(int kh = 0; kh < kernel_size; kh++) {
+						for(int kw = 0; kw < kernel_size; kw++) {
+							int h_in = h * stride + kh;
+							int w_in = w * stride + kw;
+							sum += mid1.matrix3d[in_c].matrix[h_in][w_in] * 
+								  filters[in_c][out_c].matrix[kh][kw];
+						}
+					}
+				}
+				output3d.matrix3d[out_c].matrix[h][w] = sum;
 			}
-			// Sum convolution results for each RGB channel
-			sum_rgb = add(sum_rgb, element, 0);
-		}
-		feature_maps[filter_idx] = sum_rgb;
-		if (verbose)
-		{
-			cout << "Feature map [" << filter_idx << "] : " << endl;
-			cout_mat(feature_maps[filter_idx]);
 		}
 	}
-	// Construct 3D matrix to store different feature maps at different depths
-	Matrix3d output3d = CreateMatrix3d(output_channels, feature_maps[0].row, feature_maps[0].col);
-	for (int i = 0; i < output_channels; i++)
-	{
-		output3d.matrix3d[i] = feature_maps[i];
-	}
-	if (verbose)
-	{
-		cout << "Output Matrix3d: " << endl;
-		cout_mat3d(output3d);
+
+	// 释放内存
+	for(int i = 0; i < input_dim; i++) {
+		for(int j = 0; j < output_channels; j++) {
+			free_mat(filters[i][j]);
+		}
+		free(filters[i]);
 	}
+	free(filters);
+
 	return output3d;
 }
 
@@ -729,7 +686,7 @@ Matrix4d batch_conv_test(Matrix4d mid4,
 	for (int batch_idx = 0; batch_idx < mid4.batch; batch_idx++)
 	{
 		Matrix3d mid3 = mid4.matrix4d[batch_idx];
-		Matrix3d output3d = conv_test_with_output(mid3, input_dim, output_channels, stride, kernel_size, mode, verbose);
+		Matrix3d output3d = conv_test_with_output(mid3, input_dim, output_channels, stride, kernel_size, mode, 0, verbose);
 		output3d_arr[batch_idx] = output3d;
 	}