0% found this document useful (0 votes)

45 views19 pages

HPC Programs

The document contains 6 code examples that demonstrate the use of OpenMP for parallel programming in C/C++. Example 1 shows parallelizing a matrix vector multiplication using OpenMP parallel for. Example 2 calculates the sum of array elements in parallel. Example 3 computes Pi in parallel using OpenMP reduction. Example 4 generates Fibonacci numbers in parallel threads. Examples 5 and 6 demonstrate additional uses of OpenMP parallel for and critical sections.

Uploaded by

krishna

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

45 views19 pages

HPC Programs

Uploaded by

krishna

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 19

HPC PROGRAMS

#include <iostream>
#include <stdio.h>
#include <omp.h>

/* Main Program */

/*
 * Matrix-vector product, computed with an OpenMP parallel loop and verified
 * against a serial computation.
 *
 * Reads three integers from standard input (rows, columns, vector length),
 * fills Matrix[i][j] = i + j and Vector[i] = i, prints both, multiplies them
 * twice (parallel and serial) and prints the result.
 *
 * Returns 0 on success; exits with status 1 on invalid input, allocation
 * failure, or a mismatch between the two results.
 */
int main()
{
    int NoofRows, NoofCols, Vectorsize, i, j;
    float **Matrix, *Vector, *Result, *Checkoutput;

    printf("Read the matrix size noofrows and columns and vectorsize\n");

    /* A failed or partial read is rejected together with non-positive sizes,
       so the sizes are never used while indeterminate. */
    if (scanf_s("%d%d%d", &NoofRows, &NoofCols, &Vectorsize) != 3 ||
        NoofRows <= 0 || NoofCols <= 0 || Vectorsize <= 0) {
        printf("The Matrix and Vectorsize should be of positive sign\n");
        exit(1);
    }

    /* Checking For Matrix Vector Computation Necessary Condition */
    if (NoofCols != Vectorsize) {
        printf("Matrix Vector computation cannot be possible \n");
        exit(1);
    }

    /* Dynamic Memory Allocation And Initialization Of Matrix Elements.
       The row table holds pointers, so it is sized with sizeof(float *). */
    Matrix = (float **)malloc(sizeof(float *) * NoofRows);
    if (Matrix == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    for (i = 0; i < NoofRows; i++) {
        Matrix[i] = (float *)malloc(sizeof(float) * NoofCols);
        if (Matrix[i] == NULL) {
            printf("Memory allocation failed\n");
            exit(1);
        }
        for (j = 0; j < NoofCols; j++)
            Matrix[i][j] = i + j;
    }

    /* Printing The Matrix */
    printf("The Matrix is \n");

    for (i = 0; i < NoofRows; i++) {
        for (j = 0; j < NoofCols; j++)
            printf("%f \t", Matrix[i][j]);
        printf("\n");
    }

    printf("\n");

    /* Dynamic Memory Allocation */
    Vector = (float *)malloc(sizeof(float) * Vectorsize);
    Result = (float *)malloc(sizeof(float) * NoofRows);
    Checkoutput = (float *)malloc(sizeof(float) * NoofRows);
    if (Vector == NULL || Result == NULL || Checkoutput == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    /* Vector Initialization */
    for (i = 0; i < Vectorsize; i++)
        Vector[i] = i;
    printf("\n");

    /* Printing The Vector Elements */
    printf("The Vector is \n");

    for (i = 0; i < Vectorsize; i++)
        printf("%f \t", Vector[i]);

    for (i = 0; i < NoofRows; i = i + 1) {
        Result[i] = 0;
        Checkoutput[i] = 0;
    }

    /* OpenMP Parallel Directive: rows are distributed across threads. Each
       Result[i] is written by exactly one iteration, and its inner sum runs
       in the same order as the serial loop below. */
#pragma omp parallel for private(j)
    for (i = 0; i < NoofRows; i = i + 1)
        for (j = 0; j < NoofCols; j = j + 1)
            Result[i] = Result[i] + Matrix[i][j] * Vector[j];

    /* Serial Computation */
    for (i = 0; i < NoofRows; i = i + 1)
        for (j = 0; j < NoofCols; j = j + 1)
            Checkoutput[i] = Checkoutput[i] + Matrix[i][j] * Vector[j];

    for (i = 0; i < NoofRows; i = i + 1) {
        if (Checkoutput[i] != Result[i]) {
            printf("There is a difference from Serial and Parallel Computation \n");
            exit(1);
        }
    }

    printf("\nThe Matrix Computation result is \n");

    for (i = 0; i < NoofRows; i++)
        printf("%f \n", Result[i]);

    /* Freeing The Memory Allocations: each row first, then the row table. */
    for (i = 0; i < NoofRows; i++)
        free(Matrix[i]);
    free(Matrix);
    free(Vector);
    free(Result);
    free(Checkoutput);

    return 0;
}
2.

#include <iostream>

#include<stdio.h>
#include<omp.h>

/* Main Program */

/*
 * Sum of an array computed with an OpenMP parallel loop whose accumulation
 * is protected by a critical section, verified against a serial sum.
 *
 * Reads the array size from standard input, fills Array[i] = i * 5 (and an
 * identical copy in Check), sums Array in parallel and Check serially, and
 * prints both sums.
 *
 * Returns 0 on success; exits with status 1 on invalid input, allocation
 * failure, or when the two sums are not exactly equal.
 */
int main()
{
    float *Array, *Check, serial_sum, sum;
    int array_size, i;

    printf("Enter the size of the array\n");

    /* Treat an unparsable size like a non-positive one. */
    if (scanf_s("%d", &array_size) != 1 || array_size <= 0) {
        printf("Array Size Should Be Of Positive Value ");
        exit(1);
    }

    /* Dynamic Memory Allocation */
    Array = (float *)malloc(sizeof(float) * array_size);
    Check = (float *)malloc(sizeof(float) * array_size);
    if (Array == NULL || Check == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    /* Array Elements Initialization */
    for (i = 0; i < array_size; i++) {
        Array[i] = i * 5;
        Check[i] = Array[i];
    }

    printf("The Array Elements Are \n");

    for (i = 0; i < array_size; i++)
        printf("Array[%d]=%f\n", i, Array[i]);

    sum = 0.0;

    /* OpenMP Parallel For Directive And Critical Section: the critical
       section serialises the update of the shared accumulator. */
#pragma omp parallel for shared(sum)
    for (i = 0; i < array_size; i++) {
#pragma omp critical
        sum = sum + Array[i];
    }

    serial_sum = 0.0;

    /* Serial Calculation */
    for (i = 0; i < array_size; i++)
        serial_sum = serial_sum + Check[i];

    /* NOTE(review): this is an exact float comparison. The parallel loop may
       add the elements in a different order than the serial loop, so for
       large arrays rounding can make the sums differ even when both are
       correct. */
    if (serial_sum == sum)
        printf("\nThe Serial And Parallel Sums Are Equal\n");
    else {
        printf("\nThe Serial And Parallel Sums Are UnEqual\n");
        exit(1);
    }

    /* Freeing Memory */
    free(Check);
    free(Array);

    printf("\nThe SumOfElements Of The Array Using OpenMP Directives Is %f\n", sum);

    printf("\nThe SumOfElements Of The Array By Serial Calculation Is %f\n",
           serial_sum);

    return 0;
}

#include <iostream>

#include <omp.h>
#include <stdio.h>
#include <stdlib.h>
#define MAX_THREADS 2

static long steps = 1000000000;

double step;

/*
 * Approximates pi as step * sum of 4 / (1 + x*x), sampled at the midpoint
 * x = (i + 0.5) * step of each of `steps` intervals, and times the
 * computation for every thread count from 1 to MAX_THREADS.
 *
 * argc and argv are unused. Returns 0.
 */
int main(int argc, const char* argv[]) {

    int i, j;
    double x;
    double pi, sum = 0.0;
    double start, delta;

    (void)argc;
    (void)argv;

    step = 1.0 / (double)steps;

    // Compute parallel compute times for 1-MAX_THREADS
    for (j = 1; j <= MAX_THREADS; j++) {

        printf(" running on %d threads: ", j);

        // This is the beginning of a single PI computation
        omp_set_num_threads(j);

        sum = 0.0;
        start = omp_get_wtime();

        // Each thread accumulates a private partial sum; the reduction
        // clause combines them when the loop ends.
#pragma omp parallel for reduction(+:sum) private(x)
        for (i = 0; i < steps; i++) {
            x = (i + 0.5) * step;
            sum += 4.0 / (1.0 + x * x);
        }

        // Out of the parallel region, finalize computation
        pi = step * sum;
        delta = omp_get_wtime() - start;
        printf("PI = %.16g computed in %.4g seconds\n", pi, delta);
    }

    return 0;
}

#include <iostream>
#include<stdio.h>
#include<omp.h>

/*
 * Returns the n-th Fibonacci number (fib(0) = 0, fib(1) = 1).
 *
 * For n < 2, including negative n, the argument itself is returned.
 * Computed iteratively in O(n) additions instead of by double recursion,
 * whose cost grows exponentially with n. The result does not fit in a
 * 32-bit int from n = 47 onwards.
 */
int fib(int n)
{
    int prev = 0, curr = 1, k;

    if (n < 2)
        return n;

    for (k = 2; k <= n; k++) {
        int next = prev + curr;
        prev = curr;
        curr = next;
    }
    return curr;
}

/*
 * Generates the first n Fibonacci numbers on thread 0 and prints them from
 * the other thread of a two-thread OpenMP team.
 *
 * Reads n from standard input. n must lie in [0, MAX_TERMS]: fib(46) is the
 * largest Fibonacci number that fits in a 32-bit int, and the bound also
 * keeps every write inside fibnumber.
 *
 * Returns 0 on success, 1 on invalid input.
 */
int main()
{
    enum { MAX_TERMS = 47 };
    int fibnumber[MAX_TERMS], n;

    printf("Please Enter the series limit\n");
    if (scanf_s("%d", &n) != 1 || n < 0 || n > MAX_TERMS) {
        printf("Series limit must be between 0 and %d\n", MAX_TERMS);
        return 1;
    }

#pragma omp parallel num_threads(2)
    {
        int tid = omp_get_thread_num();
        int k;

        if (tid == 0) {
            printf("There are %d threads\n", omp_get_num_threads());
            printf("Thread %d generating numbers..\n", tid);
            for (k = 0; k < n; k++)
                fibnumber[k] = fib(k);
        }

        /* A critical section only provides mutual exclusion, not ordering.
           The barrier guarantees the values are written (and flushed)
           before any other thread reads them. */
#pragma omp barrier

        if (tid != 0) {
            printf("Thread %d Printing numbers..\n", tid);
            for (k = 0; k < n; k++)
                printf("%d\t", fibnumber[k]);
        }
    }
    return 0;
}

#include <iostream>
#include <stdio.h>
#include <omp.h>
/* Main Program */

/*
 * Running average array[i] = (array[i-1] + array[i]) / 2, computed with an
 * OpenMP loop and verified against a serial loop.
 *
 * Reads the array size N from standard input and initialises both arrays
 * with array[i] = check[i] = i.
 *
 * Returns 0 on success; exits with status 1 on invalid input, allocation
 * failure, or a mismatch between the two results.
 */
int main()
{
    int i, N;
    float *array, *check;

    /* Size Of An Array */
    printf("Enter the size \n");

    if (scanf_s("%d", &N) != 1 || N <= 0) {
        printf("Array Size Should Be Of Postive Sign \n");
        exit(1);
    }

    /* Dynamic Memory Allocation */
    array = (float *)malloc(sizeof(float) * N);
    check = (float *)malloc(sizeof(float) * N);
    if (array == NULL || check == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    /* Initialization Of Array Elements */
    for (i = 0; i < N; i++) {
        array[i] = i * 1;
        check[i] = i * 1;
    }

    /* The Input Array Is */
    printf("The Input Array Is\n");

    for (i = 0; i < N; i++)
        printf("%f\t", array[i]);

    /* OpenMP Parallel For Directive With Ordered Section.
       Iteration i reads the value written by iteration i - 1, so the
       updates must happen in index order. A critical section only prevents
       simultaneous access; it does not impose that order. The ordered
       construct runs the update in loop order and so matches the serial
       result. */
#pragma omp parallel for ordered
    for (i = 1; i < N; i++) {
#pragma omp ordered
        array[i] = (array[i - 1] + array[i]) / 2;
    }

    /* Serial Calculation */
    for (i = 1; i < N; i++)
        check[i] = (check[i - 1] + check[i]) / 2;

    /* Output Checking */
    for (i = 0; i < N; i++) {
        if (check[i] != array[i]) {
            printf("There is a difference in the parallel and serial calculation \n");
            exit(1);
        }
    }

    /* The Final Output */
    printf("\nThe Array Calculation Is Same Using Serial And OpenMP Directives\n");

    printf("The Output Array Is \n");
    for (i = 0; i < N; i++)
        printf("\n %f \t", array[i]);

    printf("\n");

    /* Freeing The Memory */
    free(array);
    free(check);

    return 0;
}

#include <iostream>
#include <stdio.h>
#include <omp.h>
#define MAXIMUM 65536

/* Main Program */

/*
 * Largest element of an array of rand() values, found with OpenMP and
 * verified against a serial scan.
 *
 * Reads the element count from standard input, seeds rand() with MAXIMUM,
 * fills the array, and prints the array and its maximum.
 *
 * Returns 0 on success; exits with status 1 on invalid input, allocation
 * failure, or a mismatch between the two maxima.
 */
int main()
{
    int *array, i, Noofelements, cur_max, current_value;

    printf("Enter the number of elements\n");

    if (scanf_s("%d", &Noofelements) != 1 || Noofelements <= 0) {
        printf("The array elements cannot be stored\n");
        exit(1);
    }

    /* Dynamic Memory Allocation */
    array = (int *)malloc(sizeof(int) * Noofelements);
    if (array == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    /* Allocating Random Number Values To The Elements Of An Array */
    srand(MAXIMUM);
    for (i = 0; i < Noofelements; i++)
        array[i] = rand();

    /* A single element is its own maximum. This is a normal outcome, so the
       array is released and the program reports success. */
    if (Noofelements == 1) {
        printf("The Largest Number In The Array is %d", array[0]);
        free(array);
        return 0;
    }

    /* OpenMP Parallel Region With Critical Section.
       Each thread scans its share of the array into a private maximum and
       merges it into cur_max once, inside the critical section. cur_max is
       therefore never read while another thread may be writing it. */
    cur_max = 0;
#pragma omp parallel
    {
        int local_max = 0;

#pragma omp for
        for (i = 0; i < Noofelements; i = i + 1) {
            if (array[i] > local_max)
                local_max = array[i];
        }

#pragma omp critical
        {
            if (local_max > cur_max)
                cur_max = local_max;
        }
    }

    /* Serial Calculation */
    current_value = array[0];
    for (i = 1; i < Noofelements; i++)
        if (array[i] > current_value)
            current_value = array[i];

    printf("The Input Array Elements Are \n");

    for (i = 0; i < Noofelements; i++)
        printf("\t%d", array[i]);

    printf("\n");

    /* Checking For Output Validity */
    if (current_value == cur_max)
        printf("\nThe Max Value Is Same From Serial And Parallel OpenMP Directive\n");
    else {
        printf("\nThe Max Value Is Not Same In Serial And Parallel OpenMP Directive\n");
        exit(1);
    }

    /* Freeing Allocated Memory */
    printf("\n");
    free(array);
    printf("\nThe Largest Number In The Given Array Is %d\n", cur_max);

    return 0;
}

#include <iostream>
#include<stdio.h>
#include<omp.h>

/* Main Program */

/*
 * Sum of an array computed with an OpenMP reduction and verified against a
 * serial sum over an identical copy.
 *
 * Reads the array size from standard input and fills array_A[i] = i + 5
 * (checkarray holds the same values).
 *
 * Returns 0 on success; exits with status 1 on invalid input, allocation
 * failure, or when the two sums are not exactly equal.
 */
int main()
{
    float *array_A, sum, *checkarray, serialsum;
    int arraysize, i;

    printf("Enter the size of the array \n");

    if (scanf_s("%d", &arraysize) != 1 || arraysize <= 0) {
        printf("Positive Number Required\n");
        exit(1);
    }

    /* Dynamic Memory Allocation */
    array_A = (float *)malloc(sizeof(float) * arraysize);
    checkarray = (float *)malloc(sizeof(float) * arraysize);
    if (array_A == NULL || checkarray == NULL) {
        printf("Memory allocation failed\n");
        exit(1);
    }

    for (i = 0; i < arraysize; i++) {
        array_A[i] = i + 5;
        checkarray[i] = array_A[i];
    }

    printf("\nThe input array is \n");

    for (i = 0; i < arraysize; i++)
        printf("%f \t", array_A[i]);

    sum = 0.0;

    /* OpenMP Parallel For With Reduction Clause: every thread accumulates a
       private partial sum; the partial sums are combined after the loop. */
#pragma omp parallel for reduction(+ : sum)
    for (i = 0; i < arraysize; i++)
        sum = sum + array_A[i];

    /* Serial Calculation, over the untouched copy of the input. */
    serialsum = 0.0;
    for (i = 0; i < arraysize; i++)
        serialsum = serialsum + checkarray[i];

    /* Output Checking.
       NOTE(review): this is an exact float comparison. The reduction
       combines partial sums in a different order than the serial loop, so
       for large arrays rounding can make the sums differ even when both are
       correct. */
    if (serialsum != sum) {
        printf("\nThe calculation of array sum is different \n");
        exit(1);
    }
    else
        printf("\nThe calculation of array sum is same\n");

    /* Freeing Memory Which Was Allocated */
    free(checkarray);
    free(array_A);

    printf("The value of array sum using threads is %f\n", sum);

    printf("\nThe serial calculation of array is %f\n", serialsum);

    return 0;
}

#include <stdio.h>
#include <mpi.h>
using namespace std;
int main(int argc, char** argv) {
int mynode, totalnodes;
int sum, startval, endval, accum;
MPI_Status status;
MPI_Init(&argc, &argv);
MPI_Comm_size(MPI_COMM_WORLD, &totalnodes);
MPI_Comm_rank(MPI_COMM_WORLD, &mynode);
sum = 0;
startval = 1000 * mynode / totalnodes + 1;
endval = 1000 * (mynode + 1) / totalnodes;
for (int i = startval;i <= endval;i = i + 1)
sum = sum + i;
if (mynode != 0)
MPI_Send(&sum, 1, MPI_INT, 0, 1, MPI_COMM_WORLD);
else
for (int j = 1;j < totalnodes;j = j + 1) {
MPI_Recv(&accum, 1, MPI_INT, j, 1, MPI_COMM_WORLD, &status);
sum = sum + accum;
}
if (mynode == 0)
printf("The sum is %d\n", sum);
MPI_Finalize();
}

#include <iostream>

#include "mpi.h"
#include <math.h>
#include <stdio.h>
/*
 * Prints one table row: the label, the rank, nsend characters of the send
 * buffer, a separator, and nrecv characters of the receive buffer.
 */
static void print_row(const char* label, int rank,
                      const char* sendbuf, int nsend,
                      const char* recvbuf, int nrecv)
{
    int k;

    printf("%s%d ", label, rank);
    for (k = 0; k < nsend; k++) {
        printf(" %c", sendbuf[k]);
    }
    printf(" ");
    for (k = 0; k < nrecv; k++) {
        printf(" %c", recvbuf[k]);
    }
    printf("\n");
}

/*
 * Demonstrates the MPI collective operations (Gather, Gatherv, Allgather,
 * Allgatherv, Scatter, Alltoall, Reduce, Allreduce, Bcast) on small
 * character buffers. After each operation every rank prints one row with
 * its send buffer and its receive buffer.
 *
 * The program needs between 2 and 4 processes: the root is rank 1, and
 * counts/displs describe at most 4 ranks whose 1+2+3+4 characters fill the
 * 10-character buffers exactly.
 *
 * Returns 0 on success, 1 when started with an unsupported process count.
 */
int main(int argc, char* argv[])
{
    int p, i, Iam, root;
    int counts[4] = { 1, 2, 3, 4 };
    int displs[4] = { 0, 1, 3, 6 };
    char x[10], y[10], a, alphabet;

    /*----------------*/
    /* initialize MPI */
    /*----------------*/

    MPI_Init(&argc, &argv);

    /*---------------------------*/
    /* get the process ID number */
    /*---------------------------*/

    MPI_Comm_rank(MPI_COMM_WORLD, &Iam);

    /*-----------------------------------*/
    /* get the size of the process group */
    /*-----------------------------------*/

    MPI_Comm_size(MPI_COMM_WORLD, &p);
    root = 1;

    /* Without this check, counts[Iam] and displs[Iam] are read out of
       bounds for ranks >= 4, and rank 1 does not exist as a root when
       p == 1. */
    if (p < 2 || p > 4) {
        if (Iam == 0) {
            printf("This program requires between 2 and 4 processes\n");
        }
        MPI_Finalize();
        return 1;
    }

    if (Iam == 0) {
        printf(" Function Proc Sendbuf Recvbuf\n");
        printf(" -------- ---- ------- -------\n");
    }
    MPI_Barrier(MPI_COMM_WORLD);

    for (i = 0; i < p; i++) {
        x[i] = ' ';
    }

    alphabet = 'a';

    /*-----------------------------------*/
    /* MPI_Gather() */
    /*-----------------------------------*/

    x[0] = alphabet + Iam;

    for (i = 0; i < p; i++) {
        y[i] = ' ';
    }
    MPI_Gather(x, 1, MPI_CHAR, /* send buf,count,type */
               y, 1, MPI_CHAR, /* recv buf,count,type */
               root, /* root (data origin) */
               MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Gather : ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Gatherv() */
    /*-----------------------------------*/

    for (i = 0; i < 10; i++) {
        x[i] = ' ';
        y[i] = ' ';
    }
    /* Rank r contributes counts[r] consecutive letters starting at the
       letter with offset displs[r]. */
    for (i = 0; i < counts[Iam]; i++) {
        x[i] = alphabet + displs[Iam] + i;
    }

    MPI_Gatherv(x, counts[Iam], MPI_CHAR, /* send buf,count,type */
                y, counts, /* recv buf,count array */
                displs, MPI_CHAR, /* displacements,type */
                root, /* root (data origin) */
                MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Gatherv : ", Iam, x, p, y, 10);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Allgather() */
    /*-----------------------------------*/

    /* Only x[0] and y[0..p-1] are reset here; the remaining elements keep
       their values from the previous step. */
    x[0] = alphabet + Iam;

    for (i = 0; i < p; i++) {
        y[i] = ' ';
    }
    MPI_Allgather(x, 1, MPI_CHAR, /* send buf,count,type */
                  y, 1, MPI_CHAR, /* recv buf,count,type */
                  MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Allgather : ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Allgatherv() */
    /*-----------------------------------*/

    for (i = 0; i < 10; i++) {
        x[i] = ' ';
        y[i] = ' ';
    }
    for (i = 0; i < counts[Iam]; i++) {
        x[i] = alphabet + displs[Iam] + i;
    }

    MPI_Allgatherv(x, counts[Iam], MPI_CHAR, /* send buf,count,type */
                   y, counts, /* recv buf,count array */
                   displs, MPI_CHAR, /* displacements,type */
                   MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Allgatherv: ", Iam, x, p, y, 10);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Scatter() */
    /*-----------------------------------*/

    for (i = 0; i < p; i++) {
        x[i] = alphabet + i + Iam * p;
        y[i] = ' ';
    }
    MPI_Scatter(x, 1, MPI_CHAR, /* send buf,count,type */
                y, 1, MPI_CHAR, /* recv buf,count,type */
                root, /* root (data origin) */
                MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Scatter : ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Alltoall() */
    /*-----------------------------------*/

    for (i = 0; i < p; i++) {
        x[i] = alphabet + i + Iam * p;
        y[i] = ' ';
    }

    MPI_Alltoall(x, 1, MPI_CHAR, /* send buf,count,type */
                 y, 1, MPI_CHAR, /* recv buf,count,type */
                 MPI_COMM_WORLD); /* comm,flag */

    print_row(" MPI_Alltoall : ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Reduce() */
    /*-----------------------------------*/

    for (i = 0; i < p; i++) {
        x[i] = alphabet + i + Iam * p;
        y[i] = ' ';
    }
    /* NOTE(review): the MPI standard excludes MPI_CHAR from the datatypes
       allowed with MPI_MAX; confirm the target MPI library accepts it, or
       switch to MPI_SIGNED_CHAR / MPI_UNSIGNED_CHAR. */
    MPI_Reduce(x, y, /* send buf, recv buf */
               p, MPI_CHAR, /* count,type */
               MPI_MAX, /* operation */
               root, /* root (data origin) */
               MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Reduce MAX: ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Allreduce() */
    /*-----------------------------------*/

    for (i = 0; i < p; i++) {
        x[i] = alphabet + i + Iam * p;
        y[i] = ' ';
    }
    MPI_Allreduce(x, y, /* send buf, recv buf */
                  p, MPI_CHAR, /* count,type */
                  MPI_MAX, /* operation */
                  MPI_COMM_WORLD); /* comm */

    print_row(" MPI_Allreduce : ", Iam, x, p, y, p);

    MPI_Barrier(MPI_COMM_WORLD);

    /*-----------------------------------*/
    /* MPI_Bcast() */
    /*-----------------------------------*/

    a = ' ';
    for (i = 0; i < p; i++) {
        x[i] = ' ';
        y[i] = ' ';
    }
    if (Iam == root) {
        a = 'b';
        x[0] = a;
    }
    MPI_Bcast(&a, 1, MPI_CHAR, /* buf,count,type */
              root, MPI_COMM_WORLD); /* root,comm */

    /* The receive column shows the single broadcast character. */
    print_row(" MPI_Bcast : ", Iam, x, p, &a, 1);

    MPI_Barrier(MPI_COMM_WORLD);

    /*--------------*/
    /* Finalize MPI */
    /*--------------*/

    MPI_Finalize();
    return 0;
}

10.

#include <iostream>
#include "mpi.h"
#include <stdio.h>

#define SIZE 16
#define UP 0
#define DOWN 1
#define LEFT 2
#define RIGHT 3

/*
 * Builds a 4 x 4 non-periodic Cartesian process topology and exchanges each
 * process's rank with its up, down, left and right neighbours using
 * non-blocking sends and receives.
 *
 * Must be started with exactly SIZE processes; otherwise every process
 * prints a message and no communication takes place. Returns 0.
 */
int main(int argc, char* argv[])

{
    int numtasks, rank, source, dest, outbuf, i, tag = 1,
        inbuf[4] = { MPI_PROC_NULL,MPI_PROC_NULL,MPI_PROC_NULL,MPI_PROC_NULL },
        nbrs[4], dims[2] = { 4,4 },
        periods[2] = { 0,0 }, reorder = 0, coords[2];

    MPI_Request reqs[8];
    MPI_Status stats[8];
    MPI_Comm cartcomm;

    /*----------------*/
    /* Initialize MPI */
    /*----------------*/

    MPI_Init(&argc, &argv);

    /*-------------------------------------------------------*/
    /* Get the size of the MPI_COMM_WORLD communicator group */
    /*-------------------------------------------------------*/

    MPI_Comm_size(MPI_COMM_WORLD, &numtasks);

    if (numtasks == SIZE) {
        /*---------------------------------------------------------------------*/
        /* Make a new communicator to which 2-D Cartesian topology is attached */
        /*---------------------------------------------------------------------*/

        MPI_Cart_create(MPI_COMM_WORLD, 2, dims, periods, reorder, &cartcomm);

        /*------------------------------------------*/
        /* Get my rank in the cartcomm communicator */
        /*------------------------------------------*/

        MPI_Comm_rank(cartcomm, &rank);

        /*--------------------------------------------------------------------*/
        /* Determine process coords in cartesian topology given rank in group */
        /*--------------------------------------------------------------------*/

        MPI_Cart_coords(cartcomm, rank, 2, coords);

        /*--------------------------------------------------------------------*/
        /* Obtain the shifted source and destination ranks in both directions */
        /*--------------------------------------------------------------------*/

        MPI_Cart_shift(cartcomm, 0, 1, &nbrs[UP], &nbrs[DOWN]);
        MPI_Cart_shift(cartcomm, 1, 1, &nbrs[LEFT], &nbrs[RIGHT]);

        outbuf = rank;

        /* The neighbour ranks are ranks within cartcomm, so the exchange is
           posted on cartcomm rather than on MPI_COMM_WORLD. A missing
           neighbour is MPI_PROC_NULL, which leaves the matching inbuf entry
           at its initial value. */
        for (i = 0; i < 4; i++) {

            dest = nbrs[i];
            source = nbrs[i];

            /*----------------------------------------------*/
            /* send messages to the four adjacent processes */
            /*----------------------------------------------*/

            MPI_Isend(&outbuf, 1, MPI_INT, dest, tag,
                      cartcomm, &reqs[i]);

            /*---------------------------------------------------*/
            /* receive messages from the four adjacent processes */
            /*---------------------------------------------------*/

            MPI_Irecv(&inbuf[i], 1, MPI_INT, source, tag,
                      cartcomm, &reqs[i + 4]);
        }

        /*------------------------------------------------*/
        /* Wait for all 8 communication tasks to complete */
        /*------------------------------------------------*/

        MPI_Waitall(8, reqs, stats);

        printf("rank = %2d coords = %2d%2d neighbors(u,d,l,r) = %2d %2d %2d %2d\n",
               rank, coords[0], coords[1], nbrs[UP], nbrs[DOWN], nbrs[LEFT], nbrs[RIGHT]);
        printf("rank = %2d inbuf(u,d,l,r) = %2d %2d %2d %2d\n",
               rank, inbuf[UP], inbuf[DOWN], inbuf[LEFT], inbuf[RIGHT]);
    }
    else
        printf("Must specify %d processors. Terminating.\n", SIZE);

    /*--------------*/
    /* Finalize MPI */
    /*--------------*/

    MPI_Finalize();

    return 0;
}

11.

#include <iostream>
#include "mpi.h"
#include <stdio.h>
#include <stdlib.h>
#define MASTER 0

/*
 * Pairs each task in the lower half of the ranks with the task numtasks/2
 * above it and exchanges task ids using blocking MPI_Send / MPI_Recv.
 *
 * Requires an even number of tasks; with an odd number the master prints a
 * message and no exchange takes place. Returns 0.
 */
int main(int argc, char* argv[])

{
    int numtasks, taskid, len, partner, message;
    char hostname[MPI_MAX_PROCESSOR_NAME];
    MPI_Status status;

    MPI_Init(&argc, &argv);
    MPI_Comm_rank(MPI_COMM_WORLD, &taskid);
    MPI_Comm_size(MPI_COMM_WORLD, &numtasks);

    /* need an even number of tasks */

    if (numtasks % 2 != 0) {
        if (taskid == MASTER)
            printf("Quitting. Need an even number of tasks: numtasks=%d\n", numtasks);
    }

    else {
        if (taskid == MASTER)
            printf("MASTER: Number of MPI tasks is: %d\n", numtasks);

        MPI_Get_processor_name(hostname, &len);
        printf("Hello from task %d on %s!\n", taskid, hostname);

        /* determine partner and then send/receive with partner */

        /* The lower half sends first and the upper half receives first, so
           each blocking send is matched by a receive already posted by the
           partner. */
        if (taskid < numtasks / 2) {
            partner = numtasks / 2 + taskid;
            MPI_Send(&taskid, 1, MPI_INT, partner, 1, MPI_COMM_WORLD);
            MPI_Recv(&message, 1, MPI_INT, partner, 1, MPI_COMM_WORLD, &status);
        }
        else {
            partner = taskid - numtasks / 2;
            MPI_Recv(&message, 1, MPI_INT, partner, 1, MPI_COMM_WORLD, &status);
            MPI_Send(&taskid, 1, MPI_INT, partner, 1, MPI_COMM_WORLD);
        }

        /* print partner info and exit*/

        printf("Task %d is partner with %d\n", taskid, message);
    }

    MPI_Finalize();

    return 0;
}

12.

#include <iostream>
#include "mpi.h"
#include <stdio.h>
#include <stdlib.h>
#define MASTER 0

/*
 * Same pairing as a blocking exchange, done with non-blocking calls: every
 * task posts a receive from and a send to its partner, then waits for both
 * requests before printing the id it received.
 *
 * With an odd number of tasks the master prints a message and no exchange
 * takes place.
 */
int main(int argc, char* argv[])

{
    int numtasks, taskid, len;
    char hostname[MPI_MAX_PROCESSOR_NAME];
    int partner, message;
    MPI_Status stats[2];
    MPI_Request reqs[2];

    MPI_Init(&argc, &argv);
    MPI_Comm_rank(MPI_COMM_WORLD, &taskid);
    MPI_Comm_size(MPI_COMM_WORLD, &numtasks);

    if (numtasks % 2 == 0) {
        const int half = numtasks / 2;

        MPI_Get_processor_name(hostname, &len);
        printf("Hello from task %d on %s!\n", taskid, hostname);
        if (taskid == MASTER)
            printf("MASTER: Number of MPI tasks is: %d\n", numtasks);

        /* Lower-half ranks pair upwards, upper-half ranks pair downwards. */
        partner = (taskid < half) ? half + taskid : taskid - half;

        /* Post both operations, then block until the pair has completed. */
        MPI_Irecv(&message, 1, MPI_INT, partner, 1, MPI_COMM_WORLD, &reqs[0]);
        MPI_Isend(&taskid, 1, MPI_INT, partner, 1, MPI_COMM_WORLD, &reqs[1]);
        MPI_Waitall(2, reqs, stats);

        /* Report the id received from the partner. */
        printf("Task %d is partner with %d\n", taskid, message);
    }
    else if (taskid == MASTER) {
        /* An even number of tasks is required. */
        printf("Quitting. Need an even number of tasks: numtasks=%d\n", numtasks);
    }

    MPI_Finalize();
}

Parallel Computing Lab Manual PDF
100% (1)
Parallel Computing Lab Manual PDF
51 pages
DLD Da1
33% (3)
DLD Da1
38 pages
Module 1-Ongoing Maintenance of Computer Systems
No ratings yet
Module 1-Ongoing Maintenance of Computer Systems
12 pages
Band-in-a-Box 2018 Manual PDF
100% (1)
Band-in-a-Box 2018 Manual PDF
665 pages
Lab Programs
No ratings yet
Lab Programs
18 pages
Mathews Mar Athanasius Residential Central School: "Library Management System"
100% (1)
Mathews Mar Athanasius Residential Central School: "Library Management System"
36 pages
Computer Hardware: Parts & Functions
No ratings yet
Computer Hardware: Parts & Functions
34 pages
IDEA StatiCa Licenses Support Error Messages and Tips
No ratings yet
IDEA StatiCa Licenses Support Error Messages and Tips
16 pages
(Easy Money) Easiest Black Hat CPA Method Ever
No ratings yet
(Easy Money) Easiest Black Hat CPA Method Ever
6 pages
Architecting Splunk For High Availability and Disaster Recovery
No ratings yet
Architecting Splunk For High Availability and Disaster Recovery
47 pages
1.10 EEEQ 472 - Address Decoding
No ratings yet
1.10 EEEQ 472 - Address Decoding
14 pages
MY Useful Website List - Sheet1
No ratings yet
MY Useful Website List - Sheet1
5 pages
Technology in Action: Alan Evans Kendall Martin Mary Anne Poatsy Tenth Edition
No ratings yet
Technology in Action: Alan Evans Kendall Martin Mary Anne Poatsy Tenth Edition
86 pages
FDD and TDD PDF
No ratings yet
FDD and TDD PDF
5 pages
Dell Assignment
No ratings yet
Dell Assignment
7 pages
Multicore Architecture and Programming Lab Manual
No ratings yet
Multicore Architecture and Programming Lab Manual
29 pages
Lab Programs
No ratings yet
Lab Programs
15 pages
CP4252 Multicore Architecture and Programming Lab Manual
No ratings yet
CP4252 Multicore Architecture and Programming Lab Manual
26 pages
Operate Personal Computer
No ratings yet
Operate Personal Computer
56 pages
Ultrasonic Sensor and Servo Motor Code
No ratings yet
Ultrasonic Sensor and Servo Motor Code
6 pages
BS 7666-2-2006 - (2018-06-20 - 03-41-10 Am)
No ratings yet
BS 7666-2-2006 - (2018-06-20 - 03-41-10 Am)
30 pages
Nicknames for Gogo ᎶσᎶσ, ░G░O░G░O░, G0G0٨ـﮩﮩـ❤…
No ratings yet
Nicknames for Gogo ᎶσᎶσ, ░G░O░G░O░, G0G0٨ـﮩﮩـ❤…
1 page
Micro
No ratings yet
Micro
30 pages
Characteristics: Enterprise Resource Planning (ERP) Systems Integrate Internal and External
No ratings yet
Characteristics: Enterprise Resource Planning (ERP) Systems Integrate Internal and External
7 pages
Mimix PDF
No ratings yet
Mimix PDF
46 pages
MAP Lab Mannual
No ratings yet
MAP Lab Mannual
24 pages
MPC LAB Manual New
No ratings yet
MPC LAB Manual New
24 pages
CP 4292 MCP Lab Manual
No ratings yet
CP 4292 MCP Lab Manual
20 pages
Lab Manual
No ratings yet
Lab Manual
31 pages
Openmp
No ratings yet
Openmp
18 pages
MAP Lab Completed
No ratings yet
MAP Lab Completed
29 pages
Vector Addition: Exercise 1 (Openmp-I) Scenario - I
100% (1)
Vector Addition: Exercise 1 (Openmp-I) Scenario - I
15 pages
CP4292 Multicore Architecture Lab Manual
No ratings yet
CP4292 Multicore Architecture Lab Manual
36 pages
(Serial)
No ratings yet
(Serial)
8 pages
Multicore
No ratings yet
Multicore
23 pages
HPC Lab Manual 2317 Merged Organized
No ratings yet
HPC Lab Manual 2317 Merged Organized
35 pages
Question 1 - Serial: Output
No ratings yet
Question 1 - Serial: Output
9 pages
CP4292 Mcap
No ratings yet
CP4292 Mcap
24 pages
HPC Printout 1
No ratings yet
HPC Printout 1
22 pages
Cp4292 Multicore Lab Multicore Lab Removed
No ratings yet
Cp4292 Multicore Lab Multicore Lab Removed
37 pages
All HPC Programs
No ratings yet
All HPC Programs
16 pages
20bce2126 PDC Lab Da 3
No ratings yet
20bce2126 PDC Lab Da 3
11 pages
MPC LAB Manual New
No ratings yet
MPC LAB Manual New
23 pages
Lab 3
No ratings yet
Lab 3
23 pages
Mcap-Lab Manual 1
No ratings yet
Mcap-Lab Manual 1
19 pages
Untitled Document
No ratings yet
Untitled Document
23 pages
Excelente
No ratings yet
Excelente
64 pages
Multicore Architecture Lab Manual
No ratings yet
Multicore Architecture Lab Manual
34 pages
PDC-Lab 21BCE10419
No ratings yet
PDC-Lab 21BCE10419
20 pages
CP4292 Mcap
No ratings yet
CP4292 Mcap
15 pages
Assignment 04
No ratings yet
Assignment 04
16 pages
HPC Codes-2
No ratings yet
HPC Codes-2
15 pages
Lab # 2 by Akram
No ratings yet
Lab # 2 by Akram
14 pages
Openmp Lab: Antonio Gómez-Iglesias Agomez@Tacc - Utexas.Edu Texas Advanced Computing Center
No ratings yet
Openmp Lab: Antonio Gómez-Iglesias Agomez@Tacc - Utexas.Edu Texas Advanced Computing Center
17 pages
OpenMP Matrix
No ratings yet
OpenMP Matrix
6 pages
Subject: DSTC++: Unit-I: Above Average Questions Short Questions
No ratings yet
Subject: DSTC++: Unit-I: Above Average Questions Short Questions
7 pages
HPC 3
No ratings yet
HPC 3
7 pages
Pseudo Code of Mpi Programs
No ratings yet
Pseudo Code of Mpi Programs
22 pages
U1 Programa4 S12021
No ratings yet
U1 Programa4 S12021
6 pages
SWE2017 - Lab Assignment 1pages-7
No ratings yet
SWE2017 - Lab Assignment 1pages-7
5 pages
Tp2 - Openmp (Introduction) : Imad Kissami
No ratings yet
Tp2 - Openmp (Introduction) : Imad Kissami
4 pages
Ass3 Edited
No ratings yet
Ass3 Edited
3 pages
17bce0500 VL2019201001477 Ast02 PDF
No ratings yet
17bce0500 VL2019201001477 Ast02 PDF
6 pages
OpenMP Programs
No ratings yet
OpenMP Programs
4 pages
pgm5-7 Ydf
No ratings yet
pgm5-7 Ydf
3 pages
Par - 1 In-Term Exam - Course 2017/18-Q2
No ratings yet
Par - 1 In-Term Exam - Course 2017/18-Q2
7 pages
Parallel and Distributed Computing Lab Digital Assignment - 3
No ratings yet
Parallel and Distributed Computing Lab Digital Assignment - 3
10 pages
Lab 7
No ratings yet
Lab 7
3 pages
Workflows For Depth-Converting KINGDOM Project Data
No ratings yet
Workflows For Depth-Converting KINGDOM Project Data
10 pages
Freeware Antenna Analyzer MMANA
No ratings yet
Freeware Antenna Analyzer MMANA
8 pages
4 Performance.4x
No ratings yet
4 Performance.4x
14 pages
Parallel Computing Assignment: Submitted By: Mariya Idrees (16MCS011) M.Tech (Computer Engineering) Dated 04/05/2017
No ratings yet
Parallel Computing Assignment: Submitted By: Mariya Idrees (16MCS011) M.Tech (Computer Engineering) Dated 04/05/2017
2 pages
Practice OpenMP
No ratings yet
Practice OpenMP
2 pages
Exercise 1 (Openmp-I)
No ratings yet
Exercise 1 (Openmp-I)
10 pages
As 3
No ratings yet
As 3
2 pages
Fork Dash
No ratings yet
Fork Dash
8 pages
LocusIT - Corporate Profile
No ratings yet
LocusIT - Corporate Profile
10 pages
(SOLVED) Trend Micro OfficeScan Install Issues - Antivirus - Spiceworks
No ratings yet
(SOLVED) Trend Micro OfficeScan Install Issues - Antivirus - Spiceworks
2 pages
Cse 4001-Parallel and Distributed Computing Lab Digital Assessment-1 Name: Avulapati Anusha REG - NO: 17BCE0435
No ratings yet
Cse 4001-Parallel and Distributed Computing Lab Digital Assessment-1 Name: Avulapati Anusha REG - NO: 17BCE0435
5 pages
Name: Harshvardhan Singh Gahlaut Reg. No.: 19BCE2372 Slot: L41+L42
No ratings yet
Name: Harshvardhan Singh Gahlaut Reg. No.: 19BCE2372 Slot: L41+L42
3 pages
Apfs Stats
No ratings yet
Apfs Stats
11 pages
E 3 (Openmp - Iii) : Matrix Multiplication
No ratings yet
E 3 (Openmp - Iii) : Matrix Multiplication
10 pages
TLC0834C, TLC0834I, TLC0838C, TLC0838I 8-Bit Analog-To-Digital Converters With Serial Control
No ratings yet
TLC0834C, TLC0834I, TLC0838C, TLC0838I 8-Bit Analog-To-Digital Converters With Serial Control
14 pages
5th Sem Syllabus Autonomy
No ratings yet
5th Sem Syllabus Autonomy
28 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
150+ C Pattern Programs
From Everand
150+ C Pattern Programs
Hernando Abella
No ratings yet
C Language Programming Codes
From Everand
C Language Programming Codes
Durgesh
No ratings yet
Airtel Store in Manchester - Google Search
No ratings yet
Airtel Store in Manchester - Google Search
1 page
Global Transitions Proceedings: B Varshini, HR Yogesh, Syed Danish Pasha, Maaz Suhail, V Madhumitha, Archana Sasi
No ratings yet
Global Transitions Proceedings: B Varshini, HR Yogesh, Syed Danish Pasha, Maaz Suhail, V Madhumitha, Archana Sasi
9 pages

HPC Programs

Uploaded by

HPC Programs

Uploaded by

HPC PROGRAMS

printf("Read the matrix size noofrows and columns and vectorsize\n");

if (NoofRows <= 0 || NoofCols <= 0 || Vectorsize <= 0) {

Matrix = (float**)malloc(sizeof(float) * NoofRows);

/* Printing The Matrix */

printf("The Matrix is \n");

/* Dynamic Memory Allocation */

Vector = (float*)malloc(sizeof(float) * Vectorsize);

for (i = 0; i < Vectorsize; i++)

/* Printing The Vector Elements */

printf("The Vector is \n");

/* Dynamic Memory Allocation */

Result = (float*)malloc(sizeof(float) * NoofRows);

Checkoutput = (float*)malloc(sizeof(float) * NoofRows);

for (i = 0; i < NoofRows; i = i + 1)

/* OpenMP Parallel Directive */

#pragma omp parallel for private(j)

for (i = 0; i < NoofRows; i = i + 1)

for (i = 0; i < NoofRows; i = i + 1)

printf("\nThe Matrix Computation result is \n");

/* Freeing The Memory Allocations */

printf("Enter the size of the array\n");

Array = (float*)malloc(sizeof(float) * array_size);

/* Array Elements Initialization */

for (i = 0; i < array_size; i++) {

printf("The Array Elements Are \n");

for (i = 0; i < array_size; i++)

/* OpenMP Parallel For Directive And Critical Section */

#pragma omp parallel for shared(sum)

printf("\nThe SumOfElements Of The Array Using OpenMP Directives Is %f\n", sum);

static long steps = 1000000000;

int main(int argc, const char* argv[]) {

step = 1.0 / (double)steps;

// Compute parallel compute times for 1-MAX_THREADS

printf(" running on %d threads: ", j);

// This is the beginning of a single PI computation

#pragma omp parallel for reduction(+:sum) private(x)

// Out of the parallel region, finialize computation

printf("Enter the size \n");

array = (float*)malloc(sizeof(float) * N);

/* Initialization Of Array Elements */

for (i = 0; i < N; i++) {

/* The Input Array Is */

for (i = 0; i < N; i++)

/* OpenMP Parallel For Directive And Critical Section */

#pragma omp parallel for

for (i = 1; i < N; i++)

for (i = 0; i < N; i++) {

/* The Final Output */

printf("\nThe Array Calculation Is Same Using Serial And OpenMP Directives\n");

printf("Enter the number of elements\n");

array = (int*)malloc(sizeof(int) * Noofelements);

/* Allocating Random Number Values To The Elements Of An Array */

printf("The Input Array Elements Are \n");

for (i = 0; i < Noofelements; i++)

/* Checking For Output Validity */

/* Freeing Allocated Memory */

printf("Enter the size of the array \n");

array_A = (float*)malloc(sizeof(float) * arraysize);

for (i = 0; i < arraysize; i++) {

printf("\nThe input array is \n");

/* OpenMP Parallel For With Reduction Clause */

#pragma omp parallel for reduction(+ : sum)

/* Freeing Memory Which Was Allocated */

printf("The value of array sum using threads is %f\n", sum);

for (i = 0; i < p; i++) {

x[0] = alphabet + Iam;

printf(" MPI_Gather : %d ", Iam);

for (i = 0; i < 10; i++) {

MPI_Gatherv(x, counts[Iam], MPI_CHAR, /* send buf,count,type */

printf(" MPI_Gatherv : %d ", Iam);

x[0] = alphabet + Iam;

for (i = 0; i < p; i++) {

printf(" MPI_Allgather : %d ", Iam);

for (i = 0; i < 10; i++) {

MPI_Allgatherv(x, counts[Iam], MPI_CHAR, /* send buf,count,type */

Vector = (float)malloc(sizeof(float) Vectorsize);

Result = (float)malloc(sizeof(float) NoofRows);

Checkoutput = (float)malloc(sizeof(float) NoofRows);

Array = (float)malloc(sizeof(float) array_size);

array = (float)malloc(sizeof(float) N);

array = (int)malloc(sizeof(int) Noofelements);

array_A = (float)malloc(sizeof(float) arraysize);