#include #include #include #include #define SIZE 1024 void matmul_optimized(float** A, float** B, float** C, int n); int main() { int n = SIZE; // 分配内存空间 float** A = (float**)malloc(sizeof(float*) * n); float** B = (float**)malloc(sizeof(float*) * n); float** C = (float**)malloc(sizeof(float*) * n); int i, j; for(i=0; i