sheet 5

2025-12-10 17:13:48 +01:00 · 2025-12-10 17:13:48 +01:00 · 71c9d9b858
commit 71c9d9b858
parent 4141f31f0c
4 changed files with 1434 additions and 0 deletions
--- a/Sheet_5/bsp_5_4/Makefile
+++ b/Sheet_5/bsp_5_4/Makefile
@ -0,0 +1,30 @@
+#
+# use GNU-Compiler tools
+COMPILER=GCC_
+# alternatively from the shell
+# export COMPILER=GCC_
+# or, alternatively from the shell
+# make COMPILER=GCC_
+
+# use Intel compilers
+#COMPILER=ICC_
+
+# use PGI compilers
+# COMPILER=PGI_
+
+
+SOURCES = main.cpp bsp_3_lib_bench_par.cpp
+OBJECTS = $(SOURCES:.cpp=.o)
+
+PROGRAM	= main.${COMPILER}
+
+# uncomment the next to lines for debugging and detailed performance analysis
+CXXFLAGS += -g
+LINKFLAGS += -g
+# do not use -pg with PGI compilers
+
+ifndef COMPILER
+  COMPILER=GCC_
+endif
+
+include ../${COMPILER}default.mk
--- a/Sheet_5/bsp_5_4/bsp_3_lib_bench_par.cpp
+++ b/Sheet_5/bsp_5_4/bsp_3_lib_bench_par.cpp
--- a/Sheet_5/bsp_5_4/bsp_3_lib_bench_par.h
+++ b/Sheet_5/bsp_5_4/bsp_3_lib_bench_par.h
@ -0,0 +1,288 @@
+#pragma once
+
+#include <omp.h>
+#include <vector>
+
+/** 	Inner product
+	@param[in] x	vector
+	@param[in] y	vector
+	@return 	    resulting Euclidean inner product <x,y>
+*/
+double scalar(std::vector<double> const &x, std::vector<double> const &y);
+
+/** 	Inner product - parallel
+	@param[in] x	vector
+	@param[in] y	vector
+	@return 	    resulting Euclidean inner product <x,y>
+*/
+double scalar_par(std::vector<double> const &x, std::vector<double> const &y);
+
+
+/** 	Inner product with cblas
+	@param[in] x	vector
+	@param[in] y	vector
+	@return 	    resulting Euclidean inner product <x,y>
+*/
+double scalar_cblas(std::vector<double> const &x, std::vector<double> const &y);
+
+
+/** 	Inner product with Kahan summation
+	@param[in] x	vector
+	@param[in] y	vector
+	@return 	    resulting Euclidean inner product <x,y>
+*/
+double scalar_kahan(std::vector<double> const &x, std::vector<double> const &y);
+
+
+/** 	euclidean norm
+	@param[in] x	vector
+	@return 	    resulting Euclidean norm
+*/
+double norm_eucl(std::vector<double> const &x);
+
+
+/** 	sum of vector
+	@param[in] x	vector
+	@return 	    sum of the vector elements
+*/
+double sum(std::vector<double> const &x);
+
+
+/** 	sum of vector - parallel
+	@param[in] x	vector
+	@return 	    sum of the vector elements
+*/
+double sum_par(std::vector<double> const &x);
+
+
+/** \brief Matrix-Vektor-Multiplikation (row-wise access)
+ *
+ * \param[in]   a   Matrix with row wise access
+ * \param[in]   x   vector which gets multiplied
+ * \return          resulting product a*x (vector)
+ *
+ */
+std::vector<double> MatVec(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Matrix-Vektor-Multiplikation (row-wise access) - parallel
+ *
+ * \param[in]   a   Matrix with row wise access
+ * \param[in]   x   vector which gets multiplied
+ * \return          resulting product a*x (vector)
+ *
+ */
+std::vector<double> MatVec_par(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Matrix-Vektor-Multiplikation mit cblas (row-wise access)
+ *
+ * \param[in]   a   Matrix with row wise access
+ * \param[in]   x   vector which gets multiplied
+ * \return          resulting product a*x (vector)
+ *
+ */
+std::vector<double> MatVec_cblas(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Matrix-Vektor-Multiplikation (column-wise access)
+ *
+ * \param[in]   a   Matrix with row wise access
+ * \param[in]   x   vector which gets multiplied
+ * \return          resulting product a*x (vector)
+ *
+ */
+std::vector<double> MatVec_column(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Matrix-Matrix-Multiplikation (row-wise access)
+ *
+ * \param[in]   a   matrix with row wise access (M*L)
+ * \param[in]   b   matrix with row wise access (L*N)
+ * \param[in]   L   inner dimension of the matrix product
+ * \return          resulting product a*b
+ *
+ */
+std::vector<double> MatMatProd(std::vector<double> const & a, std::vector<double> const & b, int const & L);
+
+
+/** \brief Matrix-Matrix-Multiplikation (row-wise access) - parallel
+ *
+ * \param[in]   a   matrix with row wise access (M*L)
+ * \param[in]   b   matrix with row wise access (L*N)
+ * \param[in]   L   inner dimension of the matrix product
+ * \return          resulting product a*b
+ *
+ */
+std::vector<double> MatMatProd_par(std::vector<double> const & a, std::vector<double> const & b, int const & L);
+
+
+/** \brief Matrix-Matrix-Multiplikation mit cblas (row-wise access)
+ *
+ * \param[in]   a   matrix with row wise access (M*L)
+ * \param[in]   b   matrix with row wise access (L*N)
+ * \param[in]   L   inner dimension of the matrix product
+ * \return          resulting product a*b
+ *
+ */
+std::vector<double> MatMatProd_cblas(std::vector<double> const & a, std::vector<double> const & b, int const & L);
+
+
+/** \brief Polynomauswertung an Stelle x
+ *
+ * \param[in]   a   Vekor mit den Koeffizienten des Polynoms a=[a0,a1,a2,...]
+ * \param[in]   x   Vektor, für welchen das Polynom ausgewertet werden soll
+ * \return          resulting vector p(x)
+ *
+ */
+std::vector<double> PolynomEval(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Polynomauswertung an Stelle x - parallel
+ *
+ * \param[in]   a   Vekor mit den Koeffizienten des Polynoms a=[a0,a1,a2,...]
+ * \param[in]   x   Vektor, für welchen das Polynom ausgewertet werden soll
+ * \return          resulting vector p(x)
+ *
+ */
+std::vector<double> PolynomEval_par(std::vector<double> const & a, std::vector<double> const & x);
+
+
+/** \brief Benchmarking A - the scalar product
+ *
+ * \param   N   size of the vector
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_A(int const & N, int const & Nloops);
+
+
+/** \brief Benchmarking A - the scalar product with cblas
+ *
+ * \param   N   size of the vector
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_A_cblas(int const & N, int const & Nloops);
+
+
+
+/** \brief Benchmarking A - the scalar product with Kahan summation
+ *
+ * \param   N   size of the vector
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_A_kahan(int const & N, int const & Nloops);
+
+
+/** \brief Benchmarking A - norm
+ *
+ * \param   N   size of the vector
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_A_norm(int const & N, int const & Nloops);
+
+
+/** \brief Benchmarking B - matrix-vector product Ax=b (row wise access)
+ *
+ * \param   N   size of vector x
+ * \param   M   size of vector b (=> A: M*N)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_B(int const & N, int const & M, int const & Nloops);
+
+
+/** \brief Benchmarking B - matrix-vector product Ax=b (row wise access) [parallel]
+ *
+ * \param   N   size of vector x
+ * \param   M   size of vector b (=> A: M*N)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_B_par(int const & N, int const & M, int const & Nloops);
+
+
+/** \brief Benchmarking B - matrix-vector product Ax=b with cblas (row wise access)
+ *
+ * \param   N   size of vector x
+ * \param   M   size of vector b (=> A: M*N)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_B_cblas(int const & N, int const & M, int const & Nloops);
+
+
+/** \brief Benchmarking B - matrix-vector product Ax=b (column wise access)
+ *
+ * \param   N   size of vector x
+ * \param   M   size of vector b (=> A: M*N)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_B_column(int const & N, int const & M, int const & Nloops);
+
+
+/** \brief Benchmarking C - Matrix-Matrix product C=A*B A_M*L, B_L*N
+ *
+ * \param   N
+ * \param   M
+ * \param   L
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_C(int const & N, int const & M, int const & L, int const & Nloops);
+
+
+/** \brief Benchmarking C - Matrix-Matrix product C=A*B A_M*L, B_L*N [parallel]
+ *
+ * \param   N
+ * \param   M
+ * \param   L
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_C_par(int const & N, int const & M, int const & L, int const & Nloops);
+
+
+/** \brief Benchmarking C - Matrix-Matrix product with cblas; C=A*B A_M*L, B_L*N
+ *
+ * \param   N
+ * \param   M
+ * \param   L
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_C_cblas(int const & N, int const & M, int const & L, int const & Nloops);
+
+
+/** \brief Benchmarking D - polynomial evaluation
+ *
+ * \param   p   the degree of the polynomial
+ * \param   N   size of the input vector x where p(x)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_D(int const & p, int const & N, int const & Nloops);
+
+
+/** \brief Benchmarking D - polynomial evaluation [parallel]
+ *
+ * \param   p   the degree of the polynomial
+ * \param   N   size of the input vector x where p(x)
+ * \param   Nloops  number of iterations we want to do for the measuring
+ *
+ */
+void benchmark_D_par(int const & p, int const & N, int const & Nloops);
+
+
+/** \brief solving system of linear equations with time measurement
+ *
+ * \param   N   size of the system Ax=b with A(nxn)
+ * \param	nrhs	number of right hand sides b(nxnrhs)
+ *
+ */
+void solver(int const & N, int const & nrhs);
+
--- a/Sheet_5/bsp_5_4/main.cpp
+++ b/Sheet_5/bsp_5_4/main.cpp
@ -0,0 +1,47 @@
+#include "bsp_3_lib_bench_par.h"
+#include <cmath>
+#include <iostream>
+
+using namespace std;
+
+int main()
+{
+    benchmark_B(8000,8000,400);
+    benchmark_B_par(8000,8000,400);
+    benchmark_C(4000,4000,4000,1);
+    benchmark_C_par(4000,4000,4000,1);
+    benchmark_D(1e4,1e5,15);
+    benchmark_D_par(1e4,1e5,15);
+    
+    // comparing the time for sum and inner product with and without parallelization
+    cout << "\nComparing the runtime (in sec) for inner product and sum with and without parallelization\n\n";
+    for(int k=3; k<=8; ++k)
+    {
+		
+		int N = pow(10,k);
+		cout << "k = " << k << "	N = " << N << endl;
+		vector<double> v1(N,1.0/N);
+		vector<double> v2(N,N);
+		
+		auto tstart = omp_get_wtime();
+		double s = scalar(v1, v2);		
+		auto t_diff_scalar = omp_get_wtime() - tstart;
+		
+		tstart = omp_get_wtime();
+		double sp = scalar_par(v1, v2);		
+		auto t_diff_scalar_par = omp_get_wtime() - tstart;
+		
+		tstart = omp_get_wtime();
+		double su = sum(v1);		
+		auto t_diff_sum = omp_get_wtime() - tstart;
+		
+		tstart = omp_get_wtime();
+		double sup = sum_par(v1);		
+		auto t_diff_sum_par = omp_get_wtime() - tstart;
+		
+		cout << "sum	" << t_diff_sum << "	inner_prod	" << t_diff_scalar << endl;
+		cout << "sum_par	" << t_diff_sum_par << "	inner_prod_par	" << t_diff_scalar_par << endl << endl;;
+	}
+
+    return 0;
+}