Sample Details

Computer Science: Histogram Sort Using MPI and OpenMP


Question:

 

This is a coding assignment: implement three functions for parallel sorting with the histogram algorithm, using MPI and OpenMP in C++.

 

Answer:

The solution implements the three required routines. rebalance() evens out the data counts across ranks using one-sided MPI_Put calls into an MPI window, findSplitters() repeatedly probes the key space and builds a global histogram until it finds splitter keys that cut the data into nearly equal bins, and moveData() then ships every element to the rank that owns its bin; a final local sort() on each rank completes the distributed sort.

 

#include "solution.h"

#include <mpi.h>

#include <algorithm>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <iostream>

#include "basic_defs.h"
#include "databasics.h"

MPI_Datatype dtype = MPI_UNSIGNED_LONG_LONG;

// Get the midpoint of two numbers without overflowing uint64_t
uint64_t getMid(const uint64_t &a, const uint64_t &b) {
    uint64_t ans = a / 2 + b / 2;
    if (((a % 2) + (b % 2)) == 2) ans++;
    return ans;
}

// Find the number of items in sorted data that are less than or equal to key
uint64_t getHist(const dist_sort_t *data, const dist_sort_size_t n,
                 const dist_sort_t key) {
    // Binary search for the first index holding a value greater than key;
    // that index equals the count of items <= key.
    uint64_t a = 0, b = n;
    while (b > a) {
        uint64_t mid = getMid(a, b);
        if (data[mid] <= key)
            a = mid + 1;
        else
            b = mid;
    }
    return a;
}

 

// Check whether a histogram count lands close enough to a bin boundary to be
// accepted as a splitter; return the splitter index if so, otherwise -1.
int64_t idealSplitter(dist_sort_size_t dataPerProc, dist_sort_t hist) {
    uint64_t thresh = dataPerProc / 200;  // accept within 0.5% of a boundary
    uint64_t offset = hist % dataPerProc;
    if (offset < thresh) {
        return (int64_t)(hist / dataPerProc) - 1;
    } else if ((dataPerProc - offset) < thresh) {
        return (int64_t)(hist / dataPerProc);
    } else {
        return -1;
    }
}
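As an illustrative calculation (the numbers are chosen only for this example): with dataPerProc = 1,000,000 the tolerance is thresh = 5,000, so a probe whose global prefix count is 3,004,200 gives offset = 4,200 < 5,000 and is accepted as splitter index 3,004,200 / 1,000,000 - 1 = 2, meaning roughly three bins' worth of keys fall at or below that probe. A count of 3,500,000 misses both tolerance checks, so that probe is rejected with -1.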

 

void rebalance(const dist_sort_t *data, const dist_sort_size_t myDataCount,
               dist_sort_t **rebalancedData, dist_sort_size_t *rCount) {
    // Get the number of processes
    int nProcs;
    MPI_Comm_size(MPI_COMM_WORLD, &nProcs);

    // Get the rank of this process
    int rank;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);

    dist_sort_size_t global_N;
    // Sum all local counts to get the global count
    MPI_Allreduce(&myDataCount, &global_N, 1, dtype, MPI_SUM, MPI_COMM_WORLD);

    // Data count per process
    uint64_t dataPerProc = global_N / nProcs;
    // Number of processes holding one extra item
    uint64_t limit = global_N % nProcs;

    // Data count assigned to this process after rebalancing
    dist_sort_size_t myCount = dataPerProc + ((uint64_t)rank < limit ? 1 : 0);
    // Allocate the output array
    dist_sort_t *balanced =
        (dist_sort_t *)malloc(myCount * sizeof(dist_sort_t));

    // Global starting and ending index of this rank's current data
    uint64_t myStartGlobal, myEnd;
    MPI_Exscan(&myDataCount, &myStartGlobal, 1, dtype, MPI_SUM, MPI_COMM_WORLD);
    if (rank == 0) myStartGlobal = 0;
    myEnd = myStartGlobal + myDataCount - 1;

    // Create a window over the output array for one-sided communication
    MPI_Win win;
    MPI_Win_create(balanced, myCount * sizeof(dist_sort_t), sizeof(dist_sort_t),
                   MPI_INFO_NULL, MPI_COMM_WORLD, &win);

    MPI_Win_fence(MPI_MODE_NOPRECEDE, win);

    uint64_t next = myStartGlobal;
    while (next <= myEnd) {
        uint64_t destProcs = dataPerProc + 1;  // data count in destination rank
        uint64_t dest = next / destProcs;      // destination rank
        uint64_t disp;                         // offset in destination rank
        uint64_t size;                         // count to write to destination
        if (!(dest < limit)) {
            // Destination is one of the ranks holding dataPerProc items
            dest = (next - limit) / --destProcs;
            disp = (next - limit) % destProcs;
            size = std::min(destProcs * (dest + 1) + limit, myEnd + 1) - next;
        } else {
            // Destination is one of the ranks holding dataPerProc + 1 items
            disp = next % destProcs;
            size = std::min(destProcs * (dest + 1), myEnd + 1) - next;
        }
        // Write this chunk into the destination rank's window
        MPI_Put(&data[next - myStartGlobal], size, dtype, dest, disp, size,
                dtype, win);
        next += size;
    }
    MPI_Win_fence(MPI_MODE_NOSUCCEED, win);
    MPI_Win_free(&win);

    // Return the rebalanced data
    *rebalancedData = balanced;
    *rCount = myCount;
}

 

void findSplitters(const dist_sort_t *data, const dist_sort_size_t data_size,
                   dist_sort_t *splitters, dist_sort_size_t *counts,
                   int numSplitters) {
    // Get the number of processes
    int nProcs;
    MPI_Comm_size(MPI_COMM_WORLD, &nProcs);

    // Get the rank of this process
    int rank;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);

    dist_sort_size_t global_N;
    // Sum all local counts to get the global count
    MPI_Allreduce(&data_size, &global_N, 1, dtype, MPI_SUM, MPI_COMM_WORLD);

    // Data count per process
    uint64_t dataPerProc = global_N / nProcs;

    // Number of probes to use
    uint64_t k = 1000 * numSplitters;
    // Number of splitters not yet satisfied
    uint64_t splittersLeft = numSplitters;

    // Global prefix count (items <= splitter) for each splitter
    dist_sort_size_t prefixCounts[numSplitters];

    // The final splitter is always the maximum key
    splitters[numSplitters - 1] = DIST_SORT_MAX;
    prefixCounts[numSplitters - 1] = global_N;
    // Marks which splitters have been satisfied
    bool selected[numSplitters];
    splittersLeft--;

#pragma omp parallel for
    for (int i = 0; i < numSplitters - 1; i++) {
        selected[i] = false;
    }
    selected[numSplitters - 1] = true;

    // Probe keys, plus local and global histograms for the probes
    dist_sort_t probes[k];
    dist_sort_t localHist[k], globalHist[k];
    if (0 == rank) {
        // Initialise probes uniformly over the key range
#pragma omp parallel for
        for (int i = 0; i < k; i++)
            probes[i] = (DIST_SORT_MAX / (k + 1)) * (i + 1);
    }

    while (splittersLeft) {
        MPI_Barrier(MPI_COMM_WORLD);
        // Send the current probes to all ranks
        MPI_Bcast(probes, k, dtype, 0, MPI_COMM_WORLD);

#pragma omp parallel for
        for (int i = 0; i < k; i++) {
            // Local histogram: items on this rank that are <= each probe
            localHist[i] = getHist(data, data_size, probes[i]);
        }
        MPI_Barrier(MPI_COMM_WORLD);
        // Global histogram for all probes
        MPI_Reduce(localHist, globalHist, k, dtype, MPI_SUM, 0,
                   MPI_COMM_WORLD);

        if (0 == rank) {
#pragma omp parallel for
            for (int i = 0; i < k; i++) {
                // Check whether this probe satisfies one of the splitters
                int64_t idx = idealSplitter(dataPerProc, globalHist[i]);
                if (idx > -1 && !selected[idx]) {
                    splitters[idx] = probes[i];
                    prefixCounts[idx] = globalHist[i];
                    selected[idx] = true;
                }
            }
            splittersLeft = 0;
            for (int i = 0; i < numSplitters; i++)
                if (!selected[i]) splittersLeft++;
            if (splittersLeft) {
                // Some splitters are still unsatisfied: generate a new set of
                // probes, concentrated in the gaps between selected splitters.
                int a = -1, probeIdx = 0;
                bool running = false;
                for (int i = 0; i < numSplitters; i++) {
                    if (running) {
                        if (selected[i]) {
                            // Gap (a, i) contains i - a - 1 missing splitters;
                            // give it a proportional share of the k probes.
                            int numProbes = (i - a - 1) * k / splittersLeft;
                            dist_sort_t start = (a == -1) ? 0 : splitters[a];
                            dist_sort_t end = splitters[i];
                            for (int j = 0; j < numProbes && probeIdx < k;
                                 j++, probeIdx++) {
                                probes[probeIdx] = start + (end - start) /
                                                               (numProbes + 1) *
                                                               (j + 1);
                            }
                            running = false;
                            a = i;
                        }
                    } else {
                        if (selected[i]) {
                            a = i;
                        } else {
                            running = true;
                        }
                    }
                }
            }
        }
        MPI_Barrier(MPI_COMM_WORLD);
        // Send the updated unsatisfied-splitter count to all ranks
        MPI_Bcast(&splittersLeft, 1, dtype, 0, MPI_COMM_WORLD);
    }

    if (0 == rank) {
        // Convert prefix counts into per-bin counts
#pragma omp parallel for
        for (int i = numSplitters - 1; i > 0; i--) {
            counts[i] = prefixCounts[i] - prefixCounts[i - 1];
        }
        counts[0] = prefixCounts[0];
    }

    MPI_Barrier(MPI_COMM_WORLD);
    // Send the splitters to every rank
    MPI_Bcast(splitters, numSplitters, dtype, 0, MPI_COMM_WORLD);

    MPI_Barrier(MPI_COMM_WORLD);
    // Send the bin counts to every rank
    MPI_Bcast(counts, numSplitters, dtype, 0, MPI_COMM_WORLD);
}

 

void moveData(const dist_sort_t *const sendData,
              const dist_sort_size_t sDataCount, dist_sort_t **recvData,
              dist_sort_size_t *rDataCount, const dist_sort_t *const splitters,
              const dist_sort_t *const counts, int numSplitters) {
    // Get the number of processes
    int nProcs;
    MPI_Comm_size(MPI_COMM_WORLD, &nProcs);

    // Get the rank of this process
    int rank;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);

    // Number of local data points in each bin, and its prefix form
    dist_sort_size_t bins[numSplitters], prefixBins[numSplitters];
#pragma omp parallel for
    for (int i = 0; i < numSplitters; i++)
        prefixBins[i] = getHist(sendData, sDataCount, splitters[i]);

#pragma omp parallel for
    for (int i = numSplitters - 1; i > 0; i--)
        bins[i] = prefixBins[i] - prefixBins[i - 1];
    bins[0] = prefixBins[0];

    // For each bin, the number of data points held by lower ranks
    dist_sort_size_t myStartGlobal[numSplitters];
    MPI_Exscan(bins, myStartGlobal, numSplitters, dtype, MPI_SUM,
               MPI_COMM_WORLD);
    if (rank == 0) {
#pragma omp parallel for
        for (int i = 0; i < numSplitters; i++) myStartGlobal[i] = 0;
    }

    // Allocate the receive buffer for this rank's bin
    *recvData = (dist_sort_t *)malloc(counts[rank] * sizeof(dist_sort_t));
    *rDataCount = counts[rank];

    // Create a window over the receive buffer for one-sided communication
    MPI_Win win;
    MPI_Win_create(*recvData, counts[rank] * sizeof(dist_sort_t),
                   sizeof(dist_sort_t), MPI_INFO_NULL, MPI_COMM_WORLD, &win);

    MPI_Win_fence(MPI_MODE_NOPRECEDE, win);
    uint64_t start = 0;
    for (int i = 0; i < numSplitters; i++) {
        uint64_t size = bins[i];
        // Send this bin's local data to the rank that owns the bin
        MPI_Put(&sendData[start], size, dtype, i, myStartGlobal[i], size, dtype,
                win);
        start += bins[i];
    }
    MPI_Win_fence(MPI_MODE_NOSUCCEED, win);
    MPI_Win_free(&win);
}

 

void sort(dist_sort_t *data, dist_sort_size_t size) {
    // You are welcome to use this sort function.
    // If you wish to implement your own, you can do that too.
    // Don't use bubblesort.
    std::sort(data, data + size);
}
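For context, here is a minimal sketch of how the three functions above might be driven end to end. The harness is hypothetical and not part of the assignment code: the local data sizes and random keys are arbitrary, the number of splitters is assumed to equal the number of ranks, solution.h and basic_defs.h are assumed to declare the functions and the dist_sort_t / dist_sort_size_t types, and both types are assumed to be the same unsigned 64-bit integer suggested by the MPI_UNSIGNED_LONG_LONG datatype used throughout.

// Hypothetical driver (sketch): generate random local data, then
// rebalance -> local sort -> findSplitters -> moveData -> local sort.
#include <mpi.h>
#include <cstdlib>
#include "solution.h"  // assumed to declare the types and the four functions above

int main(int argc, char **argv) {
    MPI_Init(&argc, &argv);
    int rank, nProcs;
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);
    MPI_Comm_size(MPI_COMM_WORLD, &nProcs);

    // Each rank starts with an arbitrary, uneven amount of random data.
    dist_sort_size_t localN = 100000 + 1000 * rank;
    dist_sort_t *data = (dist_sort_t *)malloc(localN * sizeof(dist_sort_t));
    srand(rank + 1);
    for (dist_sort_size_t i = 0; i < localN; i++)
        data[i] = ((dist_sort_t)rand() << 32) ^ (dist_sort_t)rand();

    // Phase 1: even out the data counts across ranks.
    dist_sort_t *balanced = NULL;
    dist_sort_size_t balancedN = 0;
    rebalance(data, localN, &balanced, &balancedN);

    // getHist() binary-searches the local buffer, so sort before probing.
    sort(balanced, balancedN);

    // Phase 2: choose one splitter per rank (the last is DIST_SORT_MAX).
    int numSplitters = nProcs;
    dist_sort_t *splitters =
        (dist_sort_t *)malloc(numSplitters * sizeof(dist_sort_t));
    dist_sort_size_t *counts =
        (dist_sort_size_t *)malloc(numSplitters * sizeof(dist_sort_size_t));
    findSplitters(balanced, balancedN, splitters, counts, numSplitters);

    // Phase 3: route every element to the rank that owns its bin, then sort.
    dist_sort_t *finalData = NULL;
    dist_sort_size_t finalN = 0;
    moveData(balanced, balancedN, &finalData, &finalN, splitters, counts,
             numSplitters);
    sort(finalData, finalN);

    free(data); free(balanced); free(splitters); free(counts); free(finalData);
    MPI_Finalize();
    return 0;
}

The extra sort() right after rebalance() matters: findSplitters() and moveData() both call getHist(), which binary-searches the local buffer and therefore assumes it is already sorted.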

 
