Advertisement
sepi0l

hpc_reduction

Apr 25th, 2024
707
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
C++ 6.14 KB | None | 0 0
  1. #include <limits.h>
  2. #include <omp.h>
  3. #include <stdlib.h>
  4. #include <array>
  5. #include <chrono>
  6. #include <functional>
  7. #include <iostream>
  8. #include <string>
  9. #include <vector>
  10. using std::chrono::duration_cast;
  11. using std::chrono::high_resolution_clock;
  12. using std::chrono::milliseconds;
  13. using namespace std;
  14.  
  15. void s_avg(int arr[], int n)
  16. {
  17.     long sum = 0L;
  18.     int i;
  19.     for (i = 0; i < n; i++)
  20.     {
  21.         sum = sum + arr[i];
  22.     }
  23.     cout <<"sequential average: "<<sum / long(n);
  24. }
  25. void p_avg(int arr[], int n)
  26. {
  27.     long sum = 0L;
  28.     int i;
  29.     #pragma omp parallel for reduction(+ : sum) num_threads(16)
  30.     for (i = 0; i < n; i++)
  31.     {
  32.         sum = sum + arr[i];
  33.     }
  34.     cout <<"parallel average: "<<sum / long(n);
  35. }
  36. void s_sum(int arr[], int n)
  37. {
  38.     long sum = 0L;
  39.     int i;
  40.     for (i = 0; i < n; i++)
  41.     {
  42.         sum = sum + arr[i];
  43.     }
  44.     cout <<"sequential sum: "<<sum;
  45. }
  46.  
  47. void p_sum(int arr[], int n)
  48. {
  49.     long sum = 0L;
  50.     int i;
  51.     #pragma omp parallel for reduction(+ : sum) num_threads(16)
  52.     for (i = 0; i < n; i++)
  53.     {
  54.         sum = sum + arr[i];
  55.     }
  56.     cout <<"parallel sum: "<<sum;
  57. }
  58. void s_max(int arr[], int n)
  59. {
  60.     int max_val = INT_MIN;
  61.     int i;
  62.     for (i = 0; i < n; i++)
  63.     {
  64.         if (arr[i] > max_val)
  65.         {
  66.             max_val = arr[i];
  67.         }
  68.     }
  69.     cout <<"sequential max: "<<max_val;
  70. }
  71.  
  72. void p_max(int arr[], int n)
  73. {
  74.     int max_val = INT_MIN;
  75.     int i;
  76.     #pragma omp parallel for reduction(max : max_val) num_threads(16)
  77.     for (i = 0; i < n; i++)
  78.     {
  79.         if (arr[i] > max_val)
  80.         {
  81.             max_val = arr[i];
  82.         }
  83.     }
  84.     cout <<"parallel max: "<<max_val;
  85. }
  86. void s_min(int arr[], int n)
  87. {
  88.     int min_val = INT_MAX;
  89.     int i;
  90.     for (i = 0; i < n; i++)
  91.     {
  92.         if (arr[i] < min_val)
  93.         {
  94.             min_val = arr[i];
  95.         }
  96.     }
  97.     cout <<"sequential min: "<<min_val;
  98. }
  99.  
  100. void p_min(int arr[], int n)
  101. {
  102.     int min_val = INT_MAX;
  103.     int i;
  104.     #pragma omp parallel for reduction(min : min_val) num_threads(16)
  105.     for (i = 0; i < n; i++) {
  106.         if (arr[i] < min_val)
  107.         {
  108.             min_val = arr[i];
  109.         }
  110.     }
  111.     cout <<"parallel min: "<<min_val;
  112. }
  113. std::string bench_traverse(std::function<void()> traverse_fn)
  114. {
  115.     auto start = high_resolution_clock::now();
  116.     traverse_fn();
  117.     cout << " (";
  118.     auto stop = high_resolution_clock::now();
  119.     // Subtract stop and start timepoints and cast it to required unit.
  120.     // Predefined units are nanoseconds, microseconds, milliseconds, seconds, // minutes, hours. Use duration_cast() function.
  121.     auto duration = duration_cast<milliseconds>(stop - start);
  122.     // To get the value of duration use the count() member function on the
  123.     // duration object
  124.     return std::to_string(duration.count());
  125. }
  126.  
  127. int main(int argc, const char **argv)
  128. {
  129.    
  130.     long sum = 0L;
  131.     int *a, n, rand_max;
  132.    
  133.     cout << "length of the array ";
  134.     cin >> n;
  135.     cout << "max element ";
  136.     cin >> rand_max;
  137.    
  138.     a = new int[n];
  139.     for (int i = 0; i < n; i++)
  140.     {
  141.         a[i] = rand() % rand_max;
  142.     }
  143.     cout << "Generated random array of length " << n << " with elements between 0 to " << rand_max << "\n\n";
  144.     cout << "Given array is \n";
  145.     for (int i = 0; i < n; i++)
  146.     {
  147.         cout << a[i] << ", ";
  148.     }
  149.     cout << "\n\n";
  150.     omp_set_num_threads(16);
  151.  
  152.     std::cout << "Sequential Min: " << bench_traverse([&] { s_min(a, n); }) << "ms)\n";
  153.     std::cout << "Parallel (16) Min: " << bench_traverse([&] { p_min(a, n); }) << "ms)\n\n";
  154.     std::cout << "Sequential Max: " << bench_traverse([&] { s_max(a, n); }) << "ms)\n";
  155.     std::cout << "Parallel (16) Max:" << bench_traverse([&] { p_max(a, n); }) << "ms)\n\n";
  156.     std::cout << "Sequential Sum: " << bench_traverse([&] { s_sum(a, n); }) << "ms)\n";
  157.     std::cout << "Parallel (16) Sum: " << bench_traverse([&] { p_sum(a, n); }) << "ms)\n\n";
  158.     std::cout << "Sequential Average: " << bench_traverse([&] { s_avg(a, n); }) << "ms)\n";
  159.     std::cout << "Parallel (16) Average: " << bench_traverse([&] { p_avg(a, n); }) << "ms)\n\n";
  160.     return 0;
  161. }
  162.  
  163. /*
  164. This code measures the performance of various array operations such as finding the minimum,
  165. maximum, sum, and average in both sequential and parallel implementations using OpenMP. Let's break it down:
  166.  
  167. **Array Operations Functions:**
  168. 1. **Sequential Functions (`s_avg`, `s_sum`, `s_max`, `s_min`):** These functions perform the
  169. array operations sequentially without any parallelization. They calculate the average, sum,
  170. maximum, and minimum values respectively.
  171.  
  172. 2. **Parallel Functions (`p_avg`, `p_sum`, `p_max`, `p_min`):** These functions use OpenMP to
  173. parallelize the array operations. OpenMP directives (`#pragma omp parallel for reduction`) are
  174. used to distribute the work among threads and compute the result concurrently.
  175.  
  176. **Benchmarking Function (`bench_traverse`):**
  177. - This function takes a lambda function as an argument and measures the time taken to execute that function.
  178. - It records the start time, executes the function, records the stop time, calculates the duration, and returns it as milliseconds.
  179.  
  180. **Main Function:**
  181. - It dynamically generates an array of random integers with a specified length and maximum value.
  182. - Each array operation is benchmarked for both sequential and parallel implementations.
  183. - The number of threads for parallel execution is set to 16 using `omp_set_num_threads(16)`.
  184.  
  185. **Output:**
  186. - For each array operation (min, max, sum, average), the code prints the time taken for both sequential
  187. and parallel implementations in milliseconds.
  188.  
  189. **Parallelism in Array Operations:**
  190. - Parallelism is introduced using OpenMP directives such as `#pragma omp parallel for reduction`. This
  191. ensures that the work is distributed among multiple threads, and the results are combined correctly.
  192.  
  193. **Note:**
- Within each operation, the loop iterations are independent of one another, which is
what makes the OpenMP reduction-based parallelization valid.
  196.  
  197. This code demonstrates how to parallelize array operations using OpenMP to improve performance by
  198. leveraging multiple threads.
  199. */
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement