From cf609ac7b2da945c74a0b2398074df8d72357342 Mon Sep 17 00:00:00 2001
From: AZEN-SGG
Date: Fri, 28 Mar 2025 01:24:34 +0300
Subject: [PATCH] Linux part was done

---
 2025.03.28/dist/Linux/Makefile |   2 +-
 2025.03.28/dist/Linux/solve.c  | 115 +++++++++++++++++++++++++++++++++
 2025.03.28/dist/Linux/solve.h  |   2 +
 3 files changed, 118 insertions(+), 1 deletion(-)

diff --git a/2025.03.28/dist/Linux/Makefile b/2025.03.28/dist/Linux/Makefile
index f00a3fd..2dc4886 100644
--- a/2025.03.28/dist/Linux/Makefile
+++ b/2025.03.28/dist/Linux/Makefile
@@ -5,7 +5,7 @@ FLAGS = -fstack-protector-all -W -Wall -Wextra -Wunused -Wcast-align -Werror -pe
 %.o: %.c
 	gcc -c $(FLAGS) $<
 
-all: a01.out a02.out a03.out a04.out a05.out a06.out a07.out a08.out
+all: a01.out a02.out a03.out a04.out a05.out a06.out a07.out a08.out a09.out a10.out
 
 solve.o: solve.c solve.h
 array_io.o: array_io.c array_io.h
diff --git a/2025.03.28/dist/Linux/solve.c b/2025.03.28/dist/Linux/solve.c
index 78e74e8..f9ec657 100644
--- a/2025.03.28/dist/Linux/solve.c
+++ b/2025.03.28/dist/Linux/solve.c
@@ -444,3 +444,118 @@ void t8_solve(const double * restrict A, double * restrict x_0, const double * r
 	}
 }
 
+void t9_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, int n, int m, double t)
+{ // Runs m sweeps; each sweep reads x_0 and writes x, then the two local pointers are exchanged. A is read as A[i*n + j]; b, x_0 and x are indexed 0..n-1. On return the caller's x buffer holds the values written by the last sweep.
+	for (int k = 0; k < m; ++k) // one sweep per k
+	{
+		double * swap_temp;
+
+		for (int i = n-1; i >= 0; --i) // rows in descending order, so x[j] with j > i was already written in this sweep
+		{
+			double sum_x = 0; // sum over j > i of a_ij * (x_0[j] - x[j]), plus a_ii * x_0[i]
+			double sum_r = 0; // sum over all j of a_ij * x_0[j]
+			double temp = 0;
+			double aii = A[i*n + i];
+
+			#pragma omp simd reduction(+:sum_x, sum_r)
+			for (int j = n-1; j > i; --j) // columns to the right of the diagonal
+			{
+				double aij = A[i*n + j];
+				double rj = aij * x_0[j];
+				sum_x += rj - aij * x[j]; // a_ij * (x_0[j] - x[j])
+				sum_r += rj;
+			}
+
+			temp = aii * x_0[i]; // diagonal term, added to both sums
+			sum_x += temp;
+			sum_r += temp;
+
+			#pragma omp simd reduction(+:sum_r)
+			for (int j = i-1; j >= 0; --j) // columns to the left of the diagonal contribute to sum_r only
+				sum_r += A[i*n + j] * x_0[j];
+
+			x[i] = (sum_x + (b[i] - sum_r) * t) / aii; // no guard against aii == 0
+		}
+
+		swap_temp = x; // exchange the local pointers: the values just written are read as x_0 by the next sweep
+		x = x_0;
+		x_0 = swap_temp;
+	}
+
+	if (m % 2 == 0) // Author's note: "checked 100 times". Even m: the locals point at the caller's buffers again and the last written values are in x_0, so exchange the contents element-wise (for m == 0 this only exchanges the two arrays).
+		for (int i = 0; i < n; i++)
+		{
+			double temp = x[i];
+			x[i] = x_0[i];
+			x_0[i] = temp;
+		}
+	else // odd m: the last sweep already wrote into the caller's x buffer
+	{
+		double * swap_temp = x; // exchanges only the local pointer copies; nothing reads them afterwards
+		x = x_0;
+		x_0 = swap_temp;
+	}
+}
+
+void t10_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, double * restrict r, double * restrict w, int n, int m, double t)
+{ // Runs m steps; each step builds a correction r from x_0 and stores x = x_0 + r, then the two local pointers are exchanged. r and w are overwritten (indexed 0..n-1). On return the caller's x buffer holds the values written by the last step.
+	for (int k = 0; k < m; ++k) // one step per k
+	{
+		double *swap_temp = 0;
+
+		#pragma omp parallel for
+		for (int i = 0; i < n; ++i) // r = t * (b - A * x_0); the rows are split by the parallel for above
+		{
+			double sum = 0; // row i of A times x_0
+			#pragma omp simd reduction(+:sum)
+			for (int j = 0; j < n; ++j)
+				sum += A[i*n + j] * x_0[j];
+			r[i] = (b[i] - sum) * t;
+		}
+
+		for (int i = 0; i < n; ++i) // ascending pass: r[i] = (r[i] - sum over j < i of a_ij * r[j]) / a_ii
+		{
+			double sum = r[i];
+			double inai = 0;
+
+			#pragma omp simd reduction(+:sum)
+			for (int j = 0; j < i; ++j) // uses r[j] values already replaced earlier in this pass
+				sum -= A[i*n + j] * r[j];
+
+			inai = 1./A[i*n + i]; // reciprocal of the diagonal entry (no zero check); kept in w[i] for the descending pass
+			w[i] = inai;
+			r[i] = sum * inai;
+		}
+
+		#pragma omp simd
+		for (int i = 0; i < n; ++i) // multiply every r[i] by its diagonal entry a_ii
+			r[i] *= A[i*n + i];
+
+		for (int i = n-1; i >= 0; --i) // descending pass: r[i] = (r[i] - sum over j > i of a_ij * r[j]) * w[i]
+		{
+			double sum = r[i];
+
+			#pragma omp simd reduction(+:sum)
+			for (int j = n-1; j > i; --j) // uses r[j] values already replaced earlier in this pass
+				sum -= A[i*n + j] * r[j];
+
+			r[i] = sum * w[i];
+		}
+
+		#pragma omp simd
+		for (int i = 0; i < n; i++) // new values: x = x_0 + r
+			x[i] = x_0[i] + r[i];
+
+		swap_temp = x; // exchange the local pointers: the values just written are read as x_0 by the next step
+		x = x_0;
+		x_0 = swap_temp;
+	}
+
+	if (m % 2 == 0) // Author's note: "checked 100 times". Even m: the locals point at the caller's buffers again and the last written values are in x_0 (for m == 0 this only exchanges the two arrays).
+	{
+		#pragma omp simd
+		for (int i = 0; i < n; i++)
+		{ double temp = x[i]; x[i] = x_0[i]; x_0[i] = temp; } // element-wise exchange so the caller's x receives the last written values
+	} else // odd m: the last step already wrote into the caller's x buffer
+	{ double * swap_temp = x; x = x_0; x_0 = swap_temp; } // exchanges only the local pointer copies; nothing reads them afterwards
+}
diff --git a/2025.03.28/dist/Linux/solve.h b/2025.03.28/dist/Linux/solve.h
index 3c2e3ad..c0ff8a5 100644
--- a/2025.03.28/dist/Linux/solve.h
+++ b/2025.03.28/dist/Linux/solve.h
@@ -11,6 +11,8 @@ void t5_solve(const double * restrict A, double * restrict x_0, const double * r
 void t6_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, double * restrict r, int n, int m);
 void t7_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, double * restrict r, int n, int m, double t);
 void t8_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, double * restrict r, double * restrict w, int n, int m, double t);
+void t9_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, int n, int m, double t);
+void t10_solve(const double * restrict A, double * restrict x_0, const double * restrict b, double * restrict x, double * restrict r, double * restrict w, int n, int m, double t);
 
 #endif
 