-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmod4.c
48 lines (40 loc) · 1.65 KB
/
mod4.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
/*
Integration using OPENMP
Target Function to Integrate from 0 to 1: 4 / (1 + x^2) w.r.t x
Expected output: pi
Idea: Sum of area under the curve ~ sum of area of large number of rectangles under the curve
False Sharing(double areas[NUM_THREADS])
-------------
If independent data variables tend to sit on same cache line, so if some variable is changed by some thread then data is invalidated.
Affects performance, to avoid this make sure independent variables are not on same cache line or use synchronization
Prevent False sharing by adding single variable in heap which is updated by each thread with the local area value calculated and stored in their stck one time per thread
*/
#include <omp.h>
#include <stdio.h>
#define NUM_THREADS 4
int main()
{
int total_num_rectangles = 100000000;
double rect_width = 1.0 / total_num_rectangles;
double total_area = 0.0;
omp_set_num_threads(NUM_THREADS);
#pragma omp parallel
{
int thread_num = omp_get_thread_num();
//There is a chance that number of requested threads is not same as number of assigned threads
int ASSIGNED_NUM_THREADS = omp_get_num_threads();
double total_width_per_thread = 1.0 / ASSIGNED_NUM_THREADS;
double start_x = thread_num * total_width_per_thread;
int num_per_thread = total_num_rectangles / ASSIGNED_NUM_THREADS;
double area = 0.0;
for(int i=0; i<num_per_thread; i++)
{
area += rect_width * (4.0 / (1.0 + (start_x * start_x)));
start_x += rect_width;
}
// **AFTER THE LOOP**
#pragma omp critical
total_area += area;
}
printf("%f", total_area);
}